时间:2020-12-23 11:37:22 | 栏目:Python代码 | 点击:次
本文实例为大家分享了python实现按行分割文件的具体代码,供大家参考,具体内容如下
#!/usr/bin/env python #--*-- coding:utf-8 --*-- import os class SplitFiles(): """按行分割文件""" def __init__(self, file_name, line_count=200): """初始化要分割的源文件名和分割后的文件行数""" self.file_name = file_name self.line_count = line_count def split_file(self): if self.file_name and os.path.exists(self.file_name): try: with open(self.file_name) as f : # 使用with读文件 temp_count = 0 temp_content = [] part_num = 1 for line in f: if temp_count < self.line_count: temp_count += 1 else : self.write_file(part_num, temp_content) part_num += 1 temp_count = 1 temp_content = [] temp_content.append(line) else : # 正常结束循环后将剩余的内容写入新文件中 self.write_file(part_num, temp_content) except IOError as err: print(err) else: print("%s is not a validate file" % self.file_name) def get_part_file_name(self, part_num): """"获取分割后的文件名称:在源文件相同目录下建立临时文件夹temp_part_file,然后将分割后的文件放到该路径下""" temp_path = os.path.dirname(self.file_name) # 获取文件的路径(不含文件名) part_file_name = temp_path + "temp_part_file" if not os.path.exists(temp_path) : # 如果临时目录不存在则创建 os.makedirs(temp_path) part_file_name += os.sep + "temp_file_" + str(part_num) + ".part" return part_file_name def write_file(self, part_num, *line_content): """将按行分割后的内容写入相应的分割文件中""" part_file_name = self.get_part_file_name(part_num) print(line_content) try : with open(part_file_name, "w") as part_file: part_file.writelines(line_content[0]) except IOError as err: print(err) if __name__ == "__main__": sf = SplitFiles(r"F:\multiple_thread_read_file.txt") sf.split_file()
小编再为大家分享一段代码:
将文本文件按照指定的行数分割成数个小的文本文件
#! /usr/bin/env python # -*- coding: utf-8 -*- LIMIT=1000 file_count=0 url_list=[] with open("123.txt") as f: for line in f: url_list.append(line) if len(url_list)<LIMIT: continue #数据达到LIMIT file_name=str(file_count)+".txt" with open(file_name,'w') as file: for url in url_list[:-1]: #print(url) file.write(url) file.write(url_list[-1].strip()) url_list=[] file_count+=1 if url_list: file_name=str(file_count)+".txt" with open(file_name,'w') as file: for url in url_list: file.write(url) print('done')