# Python 实现数据拆分到多个 sheet (shuffle the rows of one Excel sheet and split them across several sheets)
import pandas as pd
# Shuffle the rows of one worksheet and distribute them as evenly as
# possible across `num_sheets` new worksheets in a separate workbook.

# Raw strings keep the Windows backslashes literal; in a normal string
# literal '\U' starts an 8-hex-digit unicode escape and is a SyntaxError.
file_path = r'C:\Users\pc\Desktop\record.xlsx'
output_path = r'C:\Users\pc\Desktop\distributed_data.xlsx'
sheet_name = '1000'

df = pd.read_excel(file_path, sheet_name=sheet_name, engine='openpyxl')

# frac=1 samples every row, i.e. a full shuffle; the fixed seed makes the
# resulting order reproducible between runs.
df_shuffled = df.sample(frac=1, random_state=42)

num_sheets = 3
total_rows = len(df_shuffled)
# Base size of each sheet, plus how many rows are left over.
rows_per_sheet, remainder = divmod(total_rows, num_sheets)

# The context manager saves and closes the workbook on exit, even if a
# write fails part-way (ExcelWriter.save() no longer exists in pandas 2.x).
with pd.ExcelWriter(output_path, engine='openpyxl') as writer:
    # Note: the 'Original' sheet holds the *shuffled* rows, so the slices
    # written below can be matched against it by position.
    df_shuffled.to_excel(writer, sheet_name='Original', index=False)

    start_row = 0
    for sheet_index in range(num_sheets):
        end_row = start_row + rows_per_sheet
        # The first `remainder` sheets take one extra row each, so sheet
        # sizes differ by at most one.
        if sheet_index < remainder:
            end_row += 1
        df_shuffled.iloc[start_row:end_row].to_excel(
            writer, sheet_name=f'Sheet_{sheet_index + 1}', index=False
        )
        start_row = end_row