mirror of
				https://github.com/python/cpython.git
				synced 2025-10-26 08:19:20 +00:00 
			
		
		
		
	 05e8be17fd
			
		
	
	
		05e8be17fd
		
	
	
	
	
		
			
			svn+ssh://pythondev@svn.python.org/python/trunk ........ r60990 | eric.smith | 2008-02-23 17:05:26 +0100 (Sat, 23 Feb 2008) | 1 line Removed duplicate Py_CHARMASK define. It's already defined in Python.h. ........ r60991 | andrew.kuchling | 2008-02-23 17:23:05 +0100 (Sat, 23 Feb 2008) | 4 lines #1330538: Improve comparison of xmlrpclib.DateTime and datetime instances. Remove automatic handling of datetime.date and datetime.time. This breaks backward compatibility, but python-dev discussion was strongly against this automatic conversion; see the bug for a link. ........ r60994 | andrew.kuchling | 2008-02-23 17:39:43 +0100 (Sat, 23 Feb 2008) | 1 line #835521: Add index entries for various pickle-protocol methods and attributes ........ r60995 | andrew.kuchling | 2008-02-23 18:10:46 +0100 (Sat, 23 Feb 2008) | 2 lines #1433694: minidom's .normalize() failed to set .nextSibling for last element. Fix by Malte Helmert ........ r61000 | christian.heimes | 2008-02-23 18:40:11 +0100 (Sat, 23 Feb 2008) | 1 line Patch #2167 from calvin: Remove unused imports ........ r61001 | christian.heimes | 2008-02-23 18:42:31 +0100 (Sat, 23 Feb 2008) | 1 line Patch #1957: syslogmodule: Release GIL when calling syslog(3) ........ r61002 | christian.heimes | 2008-02-23 18:52:07 +0100 (Sat, 23 Feb 2008) | 2 lines Issue #2051 and patch from Alexander Belopolsky: Permission for pyc and pyo files are inherited from the py file. ........
		
			
				
	
	
		
			130 lines
		
	
	
	
		
			3.8 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			130 lines
		
	
	
	
		
			3.8 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #!/usr/bin/env python
 | |
| 
 | |
| """\
 | |
| List python source files.
 | |
| 
 | |
| There are three functions to check whether a file is a Python source, listed
 | |
| here with increasing complexity:
 | |
| 
 | |
| - has_python_ext() checks whether a file name ends in '.py[w]'.
 | |
| - look_like_python() checks whether the file is not binary and either has
 | |
|   the '.py[w]' extension or the first line contains the word 'python'.
 | |
| - can_be_compiled() checks whether the file can be compiled by compile().
 | |
| 
 | |
| The file also must be of appropriate size - not bigger than a megabyte.
 | |
| 
 | |
| walk_python_files() recursively lists all Python files under the given directories.
 | |
| """
 | |
| __author__ = "Oleg Broytmann, Georg Brandl"
 | |
| 
 | |
| __all__ = ["has_python_ext", "looks_like_python", "can_be_compiled", "walk_python_files"]
 | |
| 
 | |
| 
 | |
| import os, re
 | |
| 
 | |
| binary_re = re.compile('[\x00-\x08\x0E-\x1F\x7F]')
 | |
| 
 | |
| debug = False
 | |
| 
 | |
| def print_debug(msg):
 | |
|     if debug: print(msg)
 | |
| 
 | |
| 
 | |
| def _open(fullpath):
 | |
|     try:
 | |
|         size = os.stat(fullpath).st_size
 | |
|     except OSError as err: # Permission denied - ignore the file
 | |
|         print_debug("%s: permission denied: %s" % (fullpath, err))
 | |
|         return None
 | |
| 
 | |
|     if size > 1024*1024: # too big
 | |
|         print_debug("%s: the file is too big: %d bytes" % (fullpath, size))
 | |
|         return None
 | |
| 
 | |
|     try:
 | |
|         return open(fullpath, 'rU')
 | |
|     except IOError as err: # Access denied, or a special file - ignore it
 | |
|         print_debug("%s: access denied: %s" % (fullpath, err))
 | |
|         return None
 | |
| 
 | |
| def has_python_ext(fullpath):
 | |
|     return fullpath.endswith(".py") or fullpath.endswith(".pyw")
 | |
| 
 | |
| def looks_like_python(fullpath):
 | |
|     infile = _open(fullpath)
 | |
|     if infile is None:
 | |
|         return False
 | |
| 
 | |
|     line = infile.readline()
 | |
|     infile.close()
 | |
| 
 | |
|     if binary_re.search(line):
 | |
|         # file appears to be binary
 | |
|         print_debug("%s: appears to be binary" % fullpath)
 | |
|         return False
 | |
| 
 | |
|     if fullpath.endswith(".py") or fullpath.endswith(".pyw"):
 | |
|         return True
 | |
|     elif "python" in line:
 | |
|         # disguised Python script (e.g. CGI)
 | |
|         return True
 | |
| 
 | |
|     return False
 | |
| 
 | |
| def can_be_compiled(fullpath):
 | |
|     infile = _open(fullpath)
 | |
|     if infile is None:
 | |
|         return False
 | |
| 
 | |
|     code = infile.read()
 | |
|     infile.close()
 | |
| 
 | |
|     try:
 | |
|         compile(code, fullpath, "exec")
 | |
|     except Exception as err:
 | |
|         print_debug("%s: cannot compile: %s" % (fullpath, err))
 | |
|         return False
 | |
| 
 | |
|     return True
 | |
| 
 | |
| 
 | |
| def walk_python_files(paths, is_python=looks_like_python, exclude_dirs=None):
 | |
|     """\
 | |
|     Recursively yield all Python source files below the given paths.
 | |
| 
 | |
|     paths: a list of files and/or directories to be checked.
 | |
|     is_python: a function that takes a file name and checks whether it is a
 | |
|                Python source file
 | |
|     exclude_dirs: a list of directory base names that should be excluded in
 | |
|                   the search
 | |
|     """
 | |
|     if exclude_dirs is None:
 | |
|         exclude_dirs=[]
 | |
| 
 | |
|     for path in paths:
 | |
|         print_debug("testing: %s" % path)
 | |
|         if os.path.isfile(path):
 | |
|             if is_python(path):
 | |
|                 yield path
 | |
|         elif os.path.isdir(path):
 | |
|             print_debug("    it is a directory")
 | |
|             for dirpath, dirnames, filenames in os.walk(path):
 | |
|                 for exclude in exclude_dirs:
 | |
|                     if exclude in dirnames:
 | |
|                         dirnames.remove(exclude)
 | |
|                 for filename in filenames:
 | |
|                     fullpath = os.path.join(dirpath, filename)
 | |
|                     print_debug("testing: %s" % fullpath)
 | |
|                     if is_python(fullpath):
 | |
|                         yield fullpath
 | |
|         else:
 | |
|             print_debug("    unknown type")
 | |
| 
 | |
| 
 | |
| if __name__ == "__main__":
 | |
|     # Two simple examples/tests
 | |
|     for fullpath in walk_python_files(['.']):
 | |
|         print(fullpath)
 | |
|     print("----------")
 | |
|     for fullpath in walk_python_files(['.'], is_python=can_be_compiled):
 | |
|         print(fullpath)
 |