84 lines
2.5 KiB
Python
Raw Normal View History

2020-04-22 12:56:21 -04:00
import os
import re
STOP_RECURSING = 23452
class VisitFiles:
"""
This is a helper class to visit a bunch of files in a tree given
the regular expressions that will match the filenames you're interested in.
Create this class like a function, and pass in these parameters:
baseDir - a string for the root directory in the search. This must not end in a slash.
fileMasks - a list of strings that contain regular expressions for filenames you want to match.
fileCB - This function is called for each filename matched. It takes these parameters:
- short filename ("blah.txt")
- relative filename ("a/b/c/blah.txt")
- long filename ("c:/basedir/a/b/c/blah.txt")
dirCB - a function called for each directory name. This can be None. If it returns STOP_RECURSING,
then it won't do callbacks for the files and directories under this one.
- relative dirName ("./a/b")
- full dirname (from the baseDir you pass into __init__) ("d:/a/b")
bRecurse - a boolean telling whether or not to recurse into other directories.
Example: This would visit all files recursively (.+ matches any non-zero-length string).
VisitFiles( ".", [".+"], MyCallback )
"""
def __init__( self, baseDir, fileMasks, fileCB, dirCB, bRecurse=1 ):
# Handle it appropriately whether they pass 1 filemask or a list of them.
if isinstance( fileMasks, list ):
self.fileMasks = [re.compile( x, re.IGNORECASE ) for x in fileMasks]
else:
self.fileMasks = [re.compile( fileMasks, re.IGNORECASE )]
self.fileCB = fileCB
self.dirCB = dirCB
self.bRecurse = bRecurse
self.__VisitFiles_R( ".", baseDir )
def __RemoveDotSlash( self, name ):
if name[0:2] == '.\\':
return name[2:]
else:
return name
def __VisitFiles_R( self, relativeDirName, baseDirName ):
if self.dirCB:
if self.dirCB( relativeDirName, baseDirName ) == 0:
return
files = os.listdir( baseDirName )
for filename in files:
upperFilename = filename.upper()
fullFilename = self.__RemoveDotSlash( baseDirName + "\\" + filename )
relativeName = self.__RemoveDotSlash( relativeDirName + "\\" + filename )
stats = os.stat( fullFilename )
if stats[0] & (1<<15):
matched = 0
for curRE in self.fileMasks:
if curRE.search( upperFilename ):
matched = 1
break
if matched:
self.fileCB( filename, relativeName, fullFilename )
else:
# It's a directory.
if self.bRecurse:
self.__VisitFiles_R( relativeName, fullFilename )