Python:将一个大型 CSV 文件分割成多个行数相同的小型 CSV 文件(音频事件检测)
按行进行分割,每 128 行数据生成一个新的 CSV 文件(最后一个文件可能不足 128 行);原文件的表头行会被跳过,不会写入分割后的文件。
import csv
import os
path = '../development (4).csv'
workspace = '../workspace'


def split_csv(source_path, output_dir, rows_per_file=128, verbose=False):
    """Split a CSV file into consecutive part files of ``rows_per_file`` rows.

    The first row of ``source_path`` is treated as a header: it is read and
    skipped, and is not copied into the part files. The remaining rows are
    written, in order, to ``part_1.csv``, ``part_2.csv``, ... inside
    ``output_dir``. The last part holds fewer rows when the number of data
    rows is not a multiple of ``rows_per_file``.

    Every part file is opened in write mode, so files left behind by an
    earlier run are overwritten instead of being appended to. Part files
    with a higher number than this run produces are left untouched.

    Args:
        source_path: Path of the CSV file to split.
        output_dir: Directory that receives the part files; it is created
            when the first part is written.
        rows_per_file: Maximum number of data rows per part file.
        verbose: When true, print the header, every row with its counters,
            and a message plus the path for each part file started.

    Returns:
        The paths of the part files written, in order. The list is empty
        when the input has no data rows.

    Raises:
        ValueError: If ``rows_per_file`` is smaller than 1.
    """
    if rows_per_file < 1:
        raise ValueError('rows_per_file must be at least 1')

    part_paths = []
    part_file = None
    part_writer = None
    try:
        with open(source_path, 'r', newline='') as source:
            reader = csv.reader(source)
            # Consume the header; a default avoids StopIteration on an empty file.
            header = next(reader, None)
            if verbose and header is not None:
                print(header)
            for index, row in enumerate(reader):
                if verbose:
                    print(row)
                    print(f'i is {index}, j is {len(part_paths)}')
                # Every rows_per_file rows, switch to a new part file.
                if index % rows_per_file == 0:
                    if part_file is not None:
                        part_file.close()
                    part_number = len(part_paths) + 1
                    csv_path = os.path.join(
                        output_dir, 'part_{}.csv'.format(part_number))
                    if verbose:
                        print(f"csv {part_number} 生成成功")
                        print(csv_path)
                    part_dir = os.path.dirname(csv_path)
                    if part_dir:
                        os.makedirs(part_dir, exist_ok=True)
                    # 'w' truncates a stale part from a previous run, so
                    # re-running the split never duplicates rows.
                    part_file = open(csv_path, 'w', newline='')
                    part_writer = csv.writer(part_file)
                    part_paths.append(csv_path)
                part_writer.writerow(row)
    finally:
        # Close the last part even if reading or writing failed midway.
        if part_file is not None:
            part_file.close()
    return part_paths


if __name__ == '__main__':
    split_csv(path, workspace, verbose=True)
分割后的效果: