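# [Advertisement injected by the hosting site; not part of this program] "A Tsinghua expert spent three months painstakingly compiling several hundred GB of resources, shared for free! ....>>>"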
# -*- coding: utf-8 -*-
#! /usr/bin/python
# NOTE: the coding declaration comes first because PEP 263 only honours it on
# the first or second line of the file.
'''
Created on 2013-12-11

@author: Java

Helpers for creating, listing, renaming, copying, moving and deleting files
and folders.  The code runs unchanged on Python 2.6+ and Python 3.
'''
import math
import os
import shutil
import sys
import time
import zipfile
from os.path import getsize, join

# The database packages are not needed by any helper below; keep the names
# available for existing importers without making them a hard requirement.
try:
    import MySQLdb
except ImportError:
    MySQLdb = None

try:
    from db.DbUtil import DbUtil
except ImportError:
    DbUtil = None


def _to_text(value):
    '''
    Return ``value`` as text, decoding byte strings with the file-system
    encoding so that non-ASCII file names survive on Python 2.
    '''
    if isinstance(value, bytes):
        return value.decode(sys.getfilesystemencoding() or 'utf-8')
    return value


def _prompt(message):
    '''
    Show the unicode ``message`` on the console and return the line typed by
    the user.
    '''
    if sys.version_info[0] < 3:
        # Python 2 prompts must be byte strings.
        return raw_input(message.encode('utf-8'))  # noqa: F821
    return input(message)


class FileOption(object):
    '''
    Collection of file-system utilities.  Several methods also remember
    their latest arguments as attributes on the instance (``self.path``
    and similar), as the original implementation did.
    '''

    def __init__(self):
        pass

    # ------------------------------------------------------------------
    # creating / listing
    # ------------------------------------------------------------------
    @staticmethod
    def _ensure_dir(path):
        '''Create ``path`` (and missing parents) unless it already exists.'''
        if not os.path.isdir(path):
            os.makedirs(path)

    def CreateFloderByList(self, pathList):
        '''
        Create every folder in a collection.

        :param pathList: iterable of folder paths
        '''
        self.pathList = pathList
        for path in pathList:
            self._ensure_dir(path)

    def CreateFloder(self, path):
        '''
        Create one folder (including missing parents) if it does not exist.

        :param path: folder path
        '''
        self.path = path
        self._ensure_dir(path)

    def readFileName(self, path):
        '''
        Return the names of the entries directly inside ``path``.

        :param path: folder path
        '''
        return os.listdir(path)

    # ------------------------------------------------------------------
    # renaming
    # ------------------------------------------------------------------
    @staticmethod
    def _rename_in_place(directory, name, newName):
        '''
        Rename ``directory/name``: a name without a dot gets ``newName``
        appended, any other name is replaced by ``newName``.

        An existing target is never overwritten, because several files of
        one folder usually map to the same target name.

        :return: True when the file was renamed
        '''
        target_name = newName if '.' in name else name + newName
        if target_name == name:
            return False
        target = os.path.join(directory, target_name)
        if os.path.exists(target):
            print('%s skipped: %s already exists' % (name, target_name))
            return False
        os.rename(os.path.join(directory, name), target)
        print('%s ok' % name)
        return True

    def renameFile(self, path):
        '''
        Batch-rename the files directly inside ``path``: names without a dot
        get ``index.html`` appended, names with a dot become ``index.html``.
        Existing targets are skipped instead of being overwritten.

        :param path: folder path
        '''
        self.path = path
        for name in os.listdir(path):
            if os.path.isfile(os.path.join(path, name)):
                print(name)
                self._rename_in_place(path, name, 'index.html')

    def renameFile2(self, path, newName):
        '''
        Batch-rename files like :meth:`renameFile`, but with a caller-chosen
        name, recursing into sub-folders and coping with non-ASCII names.

        :param path: folder path
        :param newName: new name (appended to names that contain no dot)
        '''
        # Listing a text path yields text names on Python 2 and 3 alike.
        path = _to_text(path)
        for name in os.listdir(path):
            name = _to_text(name)
            entry = os.path.join(path, name)
            if os.path.isfile(entry):
                self._rename_in_place(path, name, newName)
            elif os.path.isdir(entry):
                self.renameFile2(entry, newName)

    def renameExpendNameOfFile(self, path, oldexp_name, newexp_name):
        '''
        Change the extension of every matching file below ``path``.

        :param path: root folder
        :param oldexp_name: old extension, including the leading dot
        :param newexp_name: new extension, including the leading dot
        :return: number of files that were renamed
        '''
        self.path = path
        self.oldexp_name = oldexp_name
        self.newexp_name = newexp_name
        changedCount = 0
        for dirPath, dirs, files in os.walk(path):
            for filename in files:
                # splitext keeps the dot on the extension.
                stem, ext = os.path.splitext(filename)
                if ext != oldexp_name:
                    continue
                oldpath = os.path.join(dirPath, filename)
                # Only the extension is swapped; an identical fragment
                # elsewhere in the name is left untouched.
                newpath = os.path.join(dirPath, stem + newexp_name)
                if os.path.exists(newpath):
                    print('%s skipped: %s already exists' % (oldpath, newpath))
                    continue
                try:
                    os.rename(oldpath, newpath)
                except OSError as e:
                    print(str(e))
                    continue
                changedCount += 1
                print('No.%d change %s to %s'
                      % (changedCount, oldpath, newpath))
        return changedCount

    def renameExpendNameOfFile2(self):
        '''
        Interactive variant of :meth:`renameExpendNameOfFile`: the folder
        and both extensions (typed without the dot) are read from the
        console.

        :return: number of files that were renamed
        '''
        path = _prompt(u'请输入要处理的文件夹路径====>')
        print(path)
        old_ext = "." + _prompt(u'请输入源文件类型(不包括.)====>')
        print(old_ext)
        new_ext = "." + _prompt(u'请输入目标文件类型(不包括.)====>')
        print(new_ext)
        print('')  # blank spacer line
        self.TraverseFolder(path)
        print('')
        print(u'开始批量更名')
        print('<-----------------')
        changedCount = self.renameExpendNameOfFile(path, old_ext, new_ext)
        print('----------------->')
        return changedCount

    # ------------------------------------------------------------------
    # traversing / searching
    # ------------------------------------------------------------------
    def IteratrFolder(self, testpath):
        '''
        Return the paths of all second-level entries: for each folder
        directly inside ``testpath``, every entry it contains.  Names are
        decoded with ``sys.getfilesystemencoding()`` so non-ASCII names work.

        :param testpath: root folder
        '''
        testpath = _to_text(testpath)
        listsubDir = []
        for name in os.listdir(testpath):
            child = os.path.join(testpath, _to_text(name))
            if os.path.isdir(child):
                listsubDir.extend(
                    os.path.join(child, sub) for sub in os.listdir(child))
        return listsubDir

    def RemoveFilesByFileType(self, path, fileType):
        '''
        Delete the files directly inside ``path`` whose name ends with
        ``fileType``.

        :param path: folder path
        :param fileType: file-name ending to delete, e.g. ``'.txt'``
        :return: list of the paths that were deleted
        '''
        removed = []
        for one in os.listdir(path):
            print(one)
            removePath = os.path.join(path, one)
            # Match the file name only: matching the whole path would also
            # hit files whose parent folder merely contains ``fileType``.
            if os.path.isfile(removePath) and one.endswith(fileType):
                os.remove(removePath)
                removed.append(removePath)
        return removed

    def isSubString(self, subStrList, string):
        '''
        Tell whether ``string`` contains every sub-string of ``subStrList``.

        subStrList = ['py', 'java', 'txt']
        string = 'nihaojavaandpython.txt'
        isSubString(subStrList, string) returns True (or False)
        '''
        return all(substr in string for substr in subStrList)

    def getFileSuffix(self, filePath):
        '''
        Print the extension (``os.path.splitext``, dot included) of every
        file below ``filePath``.

        :return: list of the extensions, in traversal order
        '''
        def report(error):
            # os.walk swallows listing errors unless given a callback.
            print('error %s' % error)

        suffixes = []
        for dirPath, dirs, files in os.walk(filePath, onerror=report):
            for filename in files:
                ext = os.path.splitext(filename)[1]
                print(ext)
                suffixes.append(ext)
        return suffixes

    def _collect_by_listdir(self, filePath, fileList, suffixStr):
        '''Recursive worker of :meth:`getFileListBySuffix` (does not sort).'''
        for fileName in os.listdir(filePath):
            findPath = os.path.join(filePath, fileName)
            if os.path.isfile(findPath):
                if suffixStr and self.isSubString(suffixStr, fileName):
                    fileList.append(findPath)
            elif os.path.isdir(findPath):
                self._collect_by_listdir(findPath, fileList, suffixStr)

    def getFileListBySuffix(self, filePath, fileList, suffixStr=None):
        '''
        Collect, recursively, the files whose name contains every string of
        ``suffixStr``.  An empty ``suffixStr`` selects nothing.

        :param filePath: root folder
        :param fileList: list the matches are appended to (modified in place)
        :param suffixStr: strings that must all occur in the file name
        :return: ``fileList``, sorted
        '''
        self._collect_by_listdir(filePath, fileList, suffixStr or [])
        fileList.sort()
        return fileList

    def getFileListBySuffix_Better(self, filePath, fileList, suffixStr=None):
        '''
        Same selection rule as :meth:`getFileListBySuffix`, implemented with
        ``os.walk``.

        :param filePath: root folder
        :param fileList: list the matches are appended to (modified in place)
        :param suffixStr: strings that must all occur in the file name
        :return: ``fileList``, sorted
        '''
        suffixStr = suffixStr or []
        for dirPath, dirs, files in os.walk(filePath):
            for filename in files:
                if suffixStr and self.isSubString(suffixStr, filename):
                    # Join with the folder being visited, not with the root.
                    fileList.append(os.path.join(dirPath, filename))
        fileList.sort()
        return fileList

    def getFileListBySuffix_Best(self, filePath, fileList, suffixStr=None):
        '''
        Collect the files below ``filePath`` whose extension starts with any
        entry of ``suffixStr`` (e.g. ``'.py'`` also selects ``.pyc``).  Each
        file is listed once even when several entries match.

        :param filePath: root folder
        :param fileList: list the matches are appended to (modified in place)
        :param suffixStr: extension prefixes, including the leading dot
        :return: ``fileList``, sorted
        '''
        prefixes = tuple(suffixStr or ())
        for dirPath, dirs, files in os.walk(filePath):
            for filename in files:
                ext = os.path.splitext(filename)[1]
                if prefixes and ext.startswith(prefixes):
                    fileList.append(os.path.join(dirPath, filename))
        fileList.sort()
        return fileList

    def TraverseFolder(self, path):
        '''
        Print every folder below ``path`` with its sub-folders and files.

        :param path: root folder
        '''
        self.path = path
        print("<----folder&file---->")
        no = 0
        for current, dirs, files in os.walk(path):
            print('')
            no += 1
            print("No.%d" % no)
            print("path=%s" % current)
            if dirs:
                print("subfolders=%s"
                      % ('[' + ''.join(d + ';' for d in dirs) + ']'))
            if files:
                print("files=%s"
                      % ('[' + ''.join(f + ';' for f in files) + ']'))
        print("<----folder&file---->")

    # ------------------------------------------------------------------
    # copying / moving
    # ------------------------------------------------------------------
    def copyFiles(self, sourceDir, targetDir):
        '''
        Copy the files of ``sourceDir`` into ``targetDir`` recursively.  A
        file is copied when the target is missing or differs in size.
        Folders without files are not created in the target.
        '''
        for name in os.listdir(sourceDir):
            sourceFile = os.path.join(sourceDir, name)
            targetFile = os.path.join(targetDir, name)
            if os.path.isfile(sourceFile):
                self._ensure_dir(targetDir)
                if (not os.path.exists(targetFile)
                        or getsize(targetFile) != getsize(sourceFile)):
                    # copyfile streams the data and closes both handles.
                    shutil.copyfile(sourceFile, targetFile)
            elif os.path.isdir(sourceFile):
                self.copyFiles(sourceFile, targetFile)

    def moveFiles(self, dir, extName):
        '''
        For every file in ``dir`` ending with ``extName``, create a folder
        named after the file (extension stripped) and move the file into it.
        Other entries are left alone.

        :param dir: folder holding the original files
        :param extName: file extension, e.g. ``'.csv'``
        :raises ValueError: if ``extName`` is empty
        '''
        self.dir = dir
        self.extName = extName
        if not extName:
            raise ValueError('empty extName')
        for entry in os.listdir(dir):
            source = os.path.join(dir, entry)
            if not (os.path.isfile(source) and entry.endswith(extName)):
                continue
            name = entry[:-len(extName)]
            if not name:
                # A file called exactly ``extName`` has no folder name.
                continue
            print(name)
            folder = os.path.join(dir, name)
            if not os.path.isdir(folder):
                os.mkdir(folder)
            os.rename(source, os.path.join(folder, entry))

    def _merge_into(self, source, target):
        '''
        Move the content of folder ``source`` into folder ``target``,
        merging folders that exist on both sides, then remove ``source``.
        '''
        self._ensure_dir(target)
        for name in os.listdir(source):
            src = os.path.join(source, name)
            dst = os.path.join(target, name)
            if os.path.isdir(src) and os.path.isdir(dst):
                self._merge_into(src, dst)
            else:
                shutil.move(src, dst)
        os.rmdir(source)

    def moveDirAndFiles(self, oldPath, newPath):
        '''
        Migrate ``oldPath`` to ``newPath``.  A folder is merged into
        ``newPath`` (created when missing) and removed afterwards; a single
        file is simply moved.

        :param oldPath: source path
        :param newPath: destination path
        :return: True on success, False after printing the error otherwise
        '''
        self.oldPath = oldPath
        self.newPath = newPath
        try:
            if os.path.isdir(oldPath):
                self._merge_into(oldPath, newPath)
            else:
                shutil.move(oldPath, newPath)
            return True
        except (OSError, IOError, shutil.Error) as e:
            print('error e%s' % e)
            return False

    # ------------------------------------------------------------------
    # deleting
    # ------------------------------------------------------------------
    def deleteFolder(self, path):
        '''
        Delete everything below ``path``; ``path`` itself is kept.

        :param path: folder to empty
        '''
        self.path = path
        # Bottom-up, so each folder is already empty when it is removed.
        for root, dirs, files in os.walk(path, False):
            for name in files:
                os.remove(os.path.join(root, name))
            for name in dirs:
                entry = os.path.join(root, name)
                if os.path.islink(entry):
                    # A link to a folder must be unlinked; rmdir rejects it.
                    os.remove(entry)
                else:
                    os.rmdir(entry)

    def remove_empty_dir(self, path, remove_empty_files=True):
        '''
        Delete all empty folders below ``path`` (and ``path`` itself when it
        ends up empty).

        :param path: root folder
        :param remove_empty_files: when True (the historical behaviour),
            zero-byte files count as "empty" and are deleted first
        :return: list of the folders that were removed
        '''
        self.path = path
        removed = []
        # Bottom-up: a parent is examined after its children were handled.
        for root, dirs, files in os.walk(path, False):
            if remove_empty_files:
                for name in files:
                    fn = os.path.join(root, name)
                    try:
                        if os.path.getsize(fn) == 0:
                            os.remove(fn)
                    except OSError:
                        # Unreadable or locked: the file stays, so its
                        # folder is found non-empty below and is kept.
                        pass
            try:
                if os.listdir(root):
                    continue
                os.rmdir(root)
            except OSError:
                print("%s 删不掉!!" % (root))
            else:
                print("%s 删掉了!!" % (root))
                removed.append(root)
        return removed

    # ------------------------------------------------------------------
    # archiving / sizes
    # ------------------------------------------------------------------
    def zipAllFiles(self, startdir, zipPath, drive='F:'):
        '''
        Print the files below ``startdir`` whose folder path (with a
        trailing backslash) starts with ``drive + zipPath``.

        NOTE: writing the archive was commented out in the original
        implementation and is still disabled; only the listing is produced.

        :param startdir: folder to walk; the original note gives
            'f:/download/' as an example
        :param zipPath: path prefix of the folders to include, without drive
        :param drive: drive prefix put in front of ``zipPath``
        :return: list of the printed paths
        '''
        self.startdir = startdir
        self.zipPath = zipPath
        prefix = drive + zipPath
        matched = []
        for dirpath, dirnames, filenames in os.walk(startdir):
            newp = dirpath + '\\'
            if not newp.startswith(prefix):
                continue
            for filename in filenames:
                fullName = os.path.join(newp, filename)
                print(fullName)
                matched.append(fullName)
        return matched

    def getAllFileSize(self, path, size):
        '''
        Return ``size`` plus the total size in bytes of all files below
        ``path``.

        1B = 8 bit, 1KB = 1024 B, 1MB = 1024 KB, 1GB = 1024 MB

        :param path: root folder
        :param size: starting value the file sizes are added to
        '''
        self.path = path
        for dirpath, dirs, files in os.walk(path):
            size += sum(getsize(join(dirpath, name)) for name in files)
        return size

    def getFileSize(self, path):
        '''
        Return a list with one ``{file name: size in bytes}`` dictionary per
        file below ``path``.

        :param path: root folder
        '''
        self.path = path
        sizeList = []
        for dirpath, dirs, files in os.walk(path):
            for name in files:
                sizeList.append({name: getsize(join(dirpath, name))})
        return sizeList


if __name__ == '__main__':
    if DbUtil is not None:
        db = DbUtil()
    create = FileOption()
    size1 = create.getFileSize('F:\\pythonTest\\delete\\')