python实现大文件切割操作

前提是你 提交于 2019-12-10 08:53:37
import os
import time


def mkSubFile(lines, srcName, sub):
    [des_filename, extname] = os.path.splitext(srcName)
    filename = des_filename + '_' + str(sub) + extname
    print 'make file: %s' % filename
    fout = open(filename, 'w')
    try:
        fout.writelines(lines)
        return sub + 1
    finally:
        fout.close()


def splitByLineCount(filename, count):
    with open(filename, 'rb') as fin:
        try:
            head = fin.readline()
            buf = []
            sub = 1
            buf.append(head)
            for line in fin:
                buf.append(line)
                if len(buf) == count:
                    sub = mkSubFile(buf, filename, sub)
                    buf = []
            if len(buf) != 0:
                sub = mkSubFile(buf, filename, sub)
        finally:
            fin.close()


if __name__ == '__main__':
    # 每个文件存储40000行数据
    begin = time.time()
    splitByLineCount('/home/python/Desktop/sum.txt', 40000)
    end = time.time()
    print('time is %d seconds ' % (end - begin))

 

标签
易学教程内所有资源均来自网络或用户发布的内容,如有违反法律规定的内容欢迎反馈
该文章没有解决你所遇到的问题?点击提问,说说你的问题,让更多的人一起探讨吧!