例子1 指定分割文件大小
配置文件 config.ini
[global]
#原文件存放目录
dir1=F:\work\python\3595\pyserver\test
#新文件存放目录
dir2=F:\work\python\3595\pyserver\test1
python 代码
代码如下 | 复制代码 |
#!/usr/bin/python # -*- coding: utf-8 -*- import os,sys,ConfigParser class file_openate(object): def __init__(self): #初如化读取数据库配置 dir_config = ConfigParser.ConfigParser() file_config=open('config.ini',"rb") dir_config.readfp(file_config) self.dir1=str(dir_config.get("global","dir1")) self.dir1=unicode(self.dir1,'utf8') self.dir2=str(dir_config.get("global","dir2")) self.dir2=unicode(self.dir2,'utf8') file_config.close() #print self.dir2 #self.dir1="F:\\work\\python\\3595\\pyserver\\test" def file_list(self): input_name_han="软件有不确认性,前期使用最好先备份,以免发生数据丢失,确认备份后,请输入要分割的字节大小,按b来计算".decode('utf-8') print input_name_han while 1: input_name=raw_input("number:") if input_name.isdigit(): input_name=int(input_name) os.chdir(self.dir1) for filename in os.listdir(self.dir1): os.chdir(self.dir1) #print filename name, ext = os.path.splitext(filename) file_size=int(os.path.getsize(filename)) f=open(filename,'r') chu_nmuber=0 while file_size >= 1: #print file_size chu_nmuber=chu_nmuber + 1 if file_size >= input_name: file_size=file_size - input_name a=f.read(input_name) os.chdir(self.dir2) filename1=name + '-' + str(chu_nmuber) + ext new_f=open(filename1,'a') new_f.write(a) new_f.close() #print file_size else: a=f.read() os.chdir(self.dir2) filename1=name + '-' + str(chu_nmuber) + ext new_f=open(filename1,'a') new_f.write(a) new_f.close() break print "分割成功".decode('utf-8') + filename f.close() else: print "请输入正确的数字,请重新输入".decode('utf-8') file_name=file_openate() |
例子,按行分割文件大小
代码如下 | 复制代码 |
#!/usr/bin/env python #--*-- coding:utf-8 --*-- import os class SplitFiles(): def __init__(self, file_name, line_count=200): def split_file(self): except IOError as err: def get_part_file_name(self, part_num): def write_file(self, part_num, *line_content): if __name__ == "__main__": |
上面只是进行了分割了,如果我们又要合并怎么办呢?下面这个例子可以实现分割与合并哦,大家一起看看。
例子 分割文件与合并函数
代码如下 | 复制代码 |
#!/usr/bin/python ########################################################################## # split a file into a set of parts; join.py puts them back together; # this is a customizable version of the standard unix split command-line # utility; because it is written in Python, it also works on Windows and # can be easily modified; because it exports a function, its logic can # also be imported and reused in other applications; ########################################################################## import sys, os kilobytes = 1024 megabytes = kilobytes * 1000 chunksize = int(1.4 * megabytes) # default: roughly a floppy def split(fromfile, todir, chunksize=chunksize): if not os.path.exists(todir): # caller handles errors os.mkdir(todir) # make dir, read/write parts else: for fname in os.listdir(todir): # delete any existing files os.remove(os.path.join(todir, fname)) partnum = 0 input = open(fromfile, 'rb') # use binary mode on Windows while 1: # eof=empty string from read chunk = input.read(chunksize) # get next part <= chunksize if not chunk: break partnum = partnum+1 filename = os.path.join(todir, ('part%04d' % partnum)) fileobj = open(filename, 'wb') fileobj.write(chunk) fileobj.close() # or simply open().write() input.close() assert partnum <= 9999 # join sort fails if 5 digits return partnum if __name__ == '__main__': if len(sys.argv) == 2 and sys.argv[1] == '-help': print 'Use: split.py [file-to-split target-dir [chunksize]]' else: if len(sys.argv) < 3: interactive = 1 fromfile = raw_input('File to be split? ') # input if clicked todir = raw_input('Directory to store part files? ') else: interactive = 0 fromfile, todir = sys.argv[1:3] # args in cmdline if len(sys.argv) == 4: chunksize = int(sys.argv[3]) absfrom, absto = map(os.path.abspath, [fromfile, todir]) print 'Splitting', absfrom, 'to', absto, 'by', chunksize try: parts = split(fromfile, todir, chunksize) except: print 'Error during split:' print sys.exc_info()[0], sys.exc_info()[1] else: print 'Split finished:', parts, 'parts are in', absto if interactive: raw_input('Press Enter key') # pause if clicked join_file.py #!/usr/bin/python ########################################################################## # join all part files in a dir created by split.py, to recreate file. # This is roughly like a 'cat fromdir/* > tofile' command on unix, but is # more portable and configurable, and exports the join operation as a # reusable function. Relies on sort order of file names: must be same # length. Could extend split/join to popup Tkinter file selectors. ########################################################################## import os, sys readsize = 1024 def join(fromdir, tofile): output = open(tofile, 'wb') parts = os.listdir(fromdir) parts.sort() for filename in parts: filepath = os.path.join(fromdir, filename) fileobj = open(filepath, 'rb') while 1: filebytes = fileobj.read(readsize) if not filebytes: break output.write(filebytes) fileobj.close() output.close() if __name__ == '__main__': if len(sys.argv) == 2 and sys.argv[1] == '-help': print 'Use: join.py [from-dir-name to-file-name]' else: if len(sys.argv) != 3: interactive = 1 fromdir = raw_input('Directory containing part files? ') tofile = raw_input('Name of file to be recreated? ') else: interactive = 0 fromdir, tofile = sys.argv[1:] absfrom, absto = map(os.path.abspath, [fromdir, tofile]) print 'Joining', absfrom, 'to make', absto try: join(fromdir, tofile) except: print 'Error joining files:' print sys.exc_info()[0], sys.exc_info()[1] else: print 'Join complete: see', absto if interactive: raw_input('Press Enter key') # pause if clicked |