import pandas as pd
import numpy as np
import os
def split_excel() -> None:
    """Interactively flatten an Excel sheet into one column and split it.

    Prompts on stdin for the path of an Excel file and for the number of
    parts. Every cell returned by ``pd.read_excel`` is flattened row by row
    into a single column named ``数据`` with empty cells dropped, and the
    result is written next to the source file as ``<name>单列.xlsx``. That
    column is then cut into consecutive parts saved as ``<name>单列(1).xlsx``,
    ``<name>单列(2).xlsx``, ... in the same directory.

    Rows are distributed as evenly as possible: part sizes differ by at most
    one row, with the larger parts first. Exactly the requested number of
    part files is written; a part is empty only when there are fewer rows
    than parts.

    An invalid part count, a missing file, or a failure while reading the
    workbook is reported on stdout and the function returns early.
    """
    # Strip surrounding whitespace and quotes: paths pasted from a file
    # manager ("Copy as path") often arrive wrapped in quotes.
    file_path = input("请输入Excel文件的完整路径:").strip().strip("\"'")
    raw_count = input("请输入您想要拆分的份数:")

    # Validate the part count up front so that bad input neither raises nor
    # leaves a half-finished set of output files behind.
    try:
        num_parts = int(raw_count)
    except ValueError:
        print("拆分份数必须是正整数。")
        return
    if num_parts <= 0:
        print("拆分份数必须是正整数。")
        return

    # Make sure the file exists before trying to read it.
    if not os.path.exists(file_path):
        print("文件不存在,请检查路径是否正确。")
        return

    # Read the workbook.
    # NOTE(review): read_excel is called with its defaults, so the first row
    # is consumed as column headers and does not appear in the flattened
    # output - confirm this is intended.
    try:
        data = pd.read_excel(file_path)
    except Exception as e:
        print(f"读取Excel文件时发生错误:{e}")
        return

    # Collapse all cells into one column and drop the empty ones.
    flattened_data = pd.Series(data.values.flatten()).dropna()
    # Build the frame from a dict so the column name does not depend on the
    # Series being unnamed.
    single_column_df = pd.DataFrame({'数据': flattened_data})

    # Derive the output names from the source file's directory and stem.
    dir_name, base_name = os.path.split(file_path)
    new_file_name = os.path.splitext(base_name)[0] + "单列.xlsx"
    new_file_path = os.path.join(dir_name, new_file_name)

    # Write the single-column workbook.
    single_column_df.to_excel(new_file_path, index=False)
    print(f"新文件已保存至:{new_file_path}")

    # Split into num_parts consecutive slices. The first `remainder` parts
    # take one extra row, so no part is left empty while rows remain.
    num_rows = len(single_column_df)
    base_size, remainder = divmod(num_rows, num_parts)
    part_stem = os.path.splitext(new_file_name)[0]
    start_index = 0
    for i in range(num_parts):
        end_index = start_index + base_size + (1 if i < remainder else 0)
        part_df = single_column_df.iloc[start_index:end_index]
        part_file_name = part_stem + f"({i+1}).xlsx"
        part_file_path = os.path.join(dir_name, part_file_name)
        part_df.to_excel(part_file_path, index=False)
        print(f"拆分文件 {i+1} 已保存至:{part_file_path}")
        start_index = end_index
# Script entry point: start the interactive splitter only when this file is
# executed directly, so importing the module triggers no prompts.
if __name__ == "__main__":
    split_excel()