本文大家整理了一些比較好用的關于python分割文件的方法,方法非常的簡單實用。分享給大家供大家參考。具體如下:
例子1 指定分割文件大小
配置文件 config.ini:
#原文件存放目錄
dir1=F:\work\python\3595\pyserver\test
#新文件存放目錄
dir2=F:\work\python\3595\pyserver\test1
python 代碼如下:
# -*- coding: utf-8 -*-
import os,sys,ConfigParser
class file_openate(object):
def __init__(self):
??? #初如化讀取數(shù)據(jù)庫配置
??? dir_config = ConfigParser.ConfigParser()
??? file_config=open('config.ini',"rb")
??? dir_config.readfp(file_config)
??? self.dir1=str(dir_config.get("global","dir1"))
??? self.dir1=unicode(self.dir1,'utf8')
??? self.dir2=str(dir_config.get("global","dir2"))
??? self.dir2=unicode(self.dir2,'utf8')
??? file_config.close()
#print self.dir2
#self.dir1="F:\\work\\python\\3595\\pyserver\\test"
def file_list(self):
??? input_name_han="軟件有不確認性,前期使用最好先備份,以免發(fā)生數(shù)據(jù)丟失,確認備份后,請輸入要分割的字節(jié)大小,按b來計算".decode('utf-8')
??? print input_name_han
??? while 1:
input_name=raw_input("number:")
if input_name.isdigit():
??? input_name=int(input_name)
??? os.chdir(self.dir1)
??? for filename in os.listdir(self.dir1):
os.chdir(self.dir1)
#print filename
name, ext = os.path.splitext(filename)
file_size=int(os.path.getsize(filename))
f=open(filename,'r')
chu_nmuber=0
while file_size >= 1:
??? #print file_size
??? chu_nmuber=chu_nmuber + 1
??? if file_size >= input_name:
file_size=file_size - input_name
a=f.read(input_name)
os.chdir(self.dir2)
filename1=name + '-' + str(chu_nmuber) + ext
new_f=open(filename1,'a')
new_f.write(a)
new_f.close()
#print file_size
??? else:
a=f.read()
os.chdir(self.dir2)
filename1=name + '-' + str(chu_nmuber) + ext
new_f=open(filename1,'a')
new_f.write(a)
new_f.close()
break
print "分割成功".decode('utf-8') + filename
f.close()
else:
??? print "請輸入正確的數(shù)字,請重新輸入".decode('utf-8')
file_name=file_openate()
file_name.file_list()
例子2,按行分割文件大小
#--*-- coding:utf-8 --*--
import os
class SplitFiles():
??? """按行分割文件"""
??? def __init__(self, file_name, line_count=200):
??????? """初始化要分割的源文件名和分割后的文件行數(shù)"""
??????? self.file_name = file_name
??????? self.line_count = line_count
??? def split_file(self):
??????? if self.file_name and os.path.exists(self.file_name):
??????????? try:
??????????????? with open(self.file_name) as f : # 使用with讀文件
??????????????????? temp_count = 0
??????????????????? temp_content = []
??????????????????? part_num = 1
??????????????????? for line in f:
??????????????????????? if temp_count < self.line_count:
??????????????????????????? temp_count += 1
??????????????????????? else :
??????????????????????????? self.write_file(part_num, temp_content)
??????????????????????????? part_num += 1
??????????????????????????? temp_count = 1
??????????????????????????? temp_content = []
??????????????????????? temp_content.append(line)
??????????????????? else : # 正常結束循環(huán)后將剩余的內(nèi)容寫入新文件中
??????????????????????? self.write_file(part_num, temp_content)
??????????? except IOError as err:
??????????????? print(err)
??????? else:
??????????? print("%s is not a validate file" % self.file_name)
??? def get_part_file_name(self, part_num):
??????? """"獲取分割后的文件名稱:在源文件相同目錄下建立臨時文件夾temp_part_file,然后將分割后的文件放到該路徑下"""
??????? temp_path = os.path.dirname(self.file_name) # 獲取文件的路徑(不含文件名)
??????? part_file_name = temp_path + "temp_part_file"
??????? if not os.path.exists(temp_path) : # 如果臨時目錄不存在則創(chuàng)建
??????????? os.makedirs(temp_path)
??????? part_file_name += os.sep + "temp_file_" + str(part_num) + ".part"
??????? return part_file_name
??? def write_file(self, part_num, *line_content):
??????? """將按行分割后的內(nèi)容寫入相應的分割文件中"""
??????? part_file_name = self.get_part_file_name(part_num)
??????? print(line_content)
??????? try :
??????????? with open(part_file_name, "w") as part_file:
??????????????? part_file.writelines(line_content[0])
??????? except IOError as err:
??????????? print(err)
if __name__ == "__main__":
??? sf = SplitFiles(r"F:\multiple_thread_read_file.txt")
??? sf.split_file()
上面只是進行了分割了,如果我們又要合并怎么辦呢?下面這個例子可以實現(xiàn)分割與合并哦,大家一起看看。
例子3, 分割文件與合并函數(shù)
##########################################################################
# split a file into a set of parts; join.py puts them back together;
# this is a customizable version of the standard unix split command-line
# utility; because it is written in Python, it also works on Windows and
# can be easily modified; because it exports a function, its logic can
# also be imported and reused in other applications;
##########################################################################
?????
import sys, os
kilobytes = 1024
megabytes = kilobytes * 1000
chunksize = int(1.4 * megabytes)?? # default: roughly a floppy
?????
def split(fromfile, todir, chunksize=chunksize):
??? if not os.path.exists(todir):? # caller handles errors
os.mkdir(todir)??? # make dir, read/write parts
??? else:
for fname in os.listdir(todir):??? # delete any existing files
??? os.remove(os.path.join(todir, fname))
??? partnum = 0
??? input = open(fromfile, 'rb')?? # use binary mode on Windows
??? while 1:?????? # eof=empty string from read
chunk = input.read(chunksize)????? # get next part <= chunksize
if not chunk: break
partnum? = partnum+1
filename = os.path.join(todir, ('part%04d' % partnum))
fileobj? = open(filename, 'wb')
fileobj.write(chunk)
fileobj.close()??? # or simply open().write()
??? input.close()
??? assert partnum <= 9999 # join sort fails if 5 digits
??? return partnum
????
if __name__ == '__main__':
??? if len(sys.argv) == 2 and sys.argv[1] == '-help':
print 'Use: split.py [file-to-split target-dir [chunksize]]'
??? else:
if len(sys.argv) < 3:
??? interactive = 1
??? fromfile = raw_input('File to be split? ')?????? # input if clicked
??? todir??? = raw_input('Directory to store part files? ')
else:
??? interactive = 0
??? fromfile, todir = sys.argv[1:3]? # args in cmdline
??? if len(sys.argv) == 4: chunksize = int(sys.argv[3])
absfrom, absto = map(os.path.abspath, [fromfile, todir])
print 'Splitting', absfrom, 'to', absto, 'by', chunksize
?????
try:
??? parts = split(fromfile, todir, chunksize)
except:
??? print 'Error during split:'
??? print sys.exc_info()[0], sys.exc_info()[1]
else:
??? print 'Split finished:', parts, 'parts are in', absto
if interactive: raw_input('Press Enter key') # pause if clicked
join_file.py
?
##########################################################################
# join all part files in a dir created by split.py, to recreate file.?
# This is roughly like a 'cat fromdir/* > tofile' command on unix, but is
# more portable and configurable, and exports the join operation as a
# reusable function.? Relies on sort order of file names: must be same
# length.? Could extend split/join to popup Tkinter file selectors.
##########################################################################
?????
import os, sys
readsize = 1024
?????
def join(fromdir, tofile):
??? output = open(tofile, 'wb')
??? parts? = os.listdir(fromdir)
??? parts.sort()
??? for filename in parts:
filepath = os.path.join(fromdir, filename)
fileobj? = open(filepath, 'rb')
while 1:
??? filebytes = fileobj.read(readsize)
??? if not filebytes: break
??? output.write(filebytes)
fileobj.close()
??? output.close()
?????
if __name__ == '__main__':
??? if len(sys.argv) == 2 and sys.argv[1] == '-help':
print 'Use: join.py [from-dir-name to-file-name]'
??? else:
if len(sys.argv) != 3:
??? interactive = 1
??? fromdir = raw_input('Directory containing part files? ')
??? tofile? = raw_input('Name of file to be recreated? ')
else:
??? interactive = 0
??? fromdir, tofile = sys.argv[1:]
absfrom, absto = map(os.path.abspath, [fromdir, tofile])
print 'Joining', absfrom, 'to make', absto
?????
try:
??? join(fromdir, tofile)
except:
??? print 'Error joining files:'
??? print sys.exc_info()[0], sys.exc_info()[1]
else:
?? print 'Join complete: see', absto
if interactive: raw_input('Press Enter key') # pause if clicked
希望本文所述對大家的Python程序設計有所幫助。
更多文章、技術交流、商務合作、聯(lián)系博主
微信掃碼或搜索:z360901061

微信掃一掃加我為好友
QQ號聯(lián)系: 360901061
您的支持是博主寫作最大的動力,如果您喜歡我的文章,感覺我的文章對您有幫助,請用微信掃描下面二維碼支持博主2元、5元、10元、20元等您想捐的金額吧,狠狠點擊下面給點支持吧,站長非常感激您!手機微信長按不能支付解決辦法:請將微信支付二維碼保存到相冊,切換到微信,然后點擊微信右上角掃一掃功能,選擇支付二維碼完成支付。
【本文對您有幫助就好】元
