mirror of
				https://github.com/python/cpython.git
				synced 2025-10-25 10:44:55 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			400 lines
		
	
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable file
		
	
	
	
	
			
		
		
	
	
			400 lines
		
	
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable file
		
	
	
	
	
| #! /usr/bin/env python
 | |
| 
 | |
| """Mirror a remote ftp subtree into a local directory tree.
 | |
| 
 | |
| usage: ftpmirror [-v] [-q] [-i] [-m] [-n] [-r] [-s pat]
 | |
|                  [-l username [-p passwd [-a account]]]
 | |
|                  hostname[:port] [remotedir [localdir]]
 | |
| -v: verbose
 | |
| -q: quiet
 | |
| -i: interactive mode
 | |
| -m: macintosh server (NCSA telnet 2.4) (implies -n -s '*.o')
 | |
| -n: don't log in
 | |
| -r: remove local files/directories no longer pertinent
 | |
| -l username [-p passwd [-a account]]: login info (default .netrc or anonymous)
 | |
| -s pat: skip files matching pattern
 | |
| hostname: remote host w/ optional port separated by ':'
 | |
| remotedir: remote directory (default initial)
 | |
| localdir: local directory (default current)
 | |
| """
 | |
| 
 | |
| import os
 | |
| import sys
 | |
| import time
 | |
| import getopt
 | |
| import ftplib
 | |
| import netrc
 | |
| from fnmatch import fnmatch
 | |
| 
 | |
| # Print usage message and exit
 | |
def usage(*args):
    """Print error messages followed by the usage text, then exit.

    Each positional argument is written on its own line, followed by the
    module docstring.  Everything goes to standard error.

    Raises:
        SystemExit: always, with exit status 2.
    """
    # Write to stderr directly rather than rebinding sys.stdout: a caller
    # that catches SystemExit must not be left with stdout redirected.
    for msg in args:
        sys.stderr.write('%s\n' % (msg,))
    sys.stderr.write('%s\n' % (__doc__,))
    sys.exit(2)
 | |
| 
 | |
# Option state shared by main() and the mirroring helpers.  main() updates
# these from the command line before any mirroring starts.
verbose = 1         # 0 for -q, 2 for -v
interactive = 0     # -i: ask before retrieving each file/subdirectory
mac = 0             # -m: listing lines are bare names, trailing '/' = dir
rmok = 0            # -r: delete local files that are no longer pertinent
nologin = 0         # -n (implied by -m): skip the FTP login step
# fnmatch patterns for names that are never mirrored; -s appends to this.
skippats = ['.', '..', '.mirrorinfo']
 | |
| 
 | |
| # Main program: parse command line and start processing
 | |
def main():
    """Parse the command line, connect to the FTP server and mirror it.

    The accepted options and positional arguments are listed in the module
    docstring.  Login data is taken from the netrc file when it has an entry
    for the host; -l/-p/-a override the individual fields.  The module-level
    option globals are updated in place, then mirrorsubdir() is started on
    the requested remote directory.

    Exits through usage() (status 2) on any command-line error.
    """
    global verbose, interactive, mac, rmok, nologin
    try:
        # 'b' is accepted but has no handler below -- presumably kept so
        # that old command lines keep working (TODO confirm).
        opts, args = getopt.getopt(sys.argv[1:], 'a:bil:mnp:qrs:v')
    except getopt.error as msg:
        usage(msg)
    if not args:
        usage('hostname missing')

    host = args[0]
    port = 0
    if ':' in host:
        host, port = host.split(':', 1)
        try:
            port = int(port)
        except ValueError:
            usage('invalid port number: %r' % (port,))

    # Defaults from the netrc file; a missing or malformed file is ignored.
    login = passwd = account = ''
    try:
        auth = netrc.netrc().authenticators(host)
    except (netrc.NetrcParseError, IOError):
        auth = None
    if auth is not None:
        # netrc may hand back None for fields absent from the entry; ftplib
        # concatenates these values into commands, so normalise to ''.
        login, account, passwd = [field or '' for field in auth]

    for opt, value in opts:
        if opt == '-l':
            login = value
        elif opt == '-p':
            passwd = value
        elif opt == '-a':
            account = value
        elif opt == '-v':
            verbose = verbose + 1
        elif opt == '-q':
            verbose = 0
        elif opt == '-i':
            interactive = 1
        elif opt == '-m':
            mac = 1
            nologin = 1
            skippats.append('*.o')
        elif opt == '-n':
            nologin = 1
        elif opt == '-r':
            rmok = 1
        elif opt == '-s':
            skippats.append(value)

    if len(args) > 3:
        usage('too many arguments')
    remotedir = args[1] if len(args) > 1 else ''
    localdir = args[2] if len(args) > 2 else ''

    f = ftplib.FTP()
    if verbose:
        port_suffix = ':%d' % port if port else ''
        print("Connecting to '%s%s'..." % (host, port_suffix))
    f.connect(host, port)
    try:
        if not nologin:
            if verbose:
                print('Logging in as %r...' % (login or 'anonymous'))
            f.login(login, passwd, account)
        if verbose:
            print('OK.')
        pwd = f.pwd()
        if verbose > 1:
            print('PWD = %r' % (pwd,))
        if remotedir:
            if verbose > 1:
                print('cwd(%r)' % (remotedir,))
            f.cwd(remotedir)
            if verbose > 1:
                print('OK.')
            pwd = f.pwd()
            if verbose > 1:
                print('PWD = %r' % (pwd,))
        mirrorsubdir(f, localdir)
    finally:
        # Release the control connection even when mirroring fails.
        f.close()
 | |
| 
 | |
| # Core logic: mirror one subdirectory (recursively)
 | |
def mirrorsubdir(f, localdir):
    """Mirror the current remote directory of *f* into *localdir*.

    Steps, in order:
      1. create *localdir* if needed and load its '.mirrorinfo' record;
      2. LIST the remote directory and fetch every file or symlink whose
         listing data differs from the record (via an '@name' temp file
         that is renamed into place);
      3. drop record entries for files that are no longer listed;
      4. report, or with -r remove, local entries that are neither in the
         record nor remote subdirectories;
      5. recurse into each remote subdirectory.

    Args:
        f: a connected ftplib.FTP-like object (pwd, cwd, retrlines and
            retrbinary are used).
        localdir: local target directory; '' means the current directory.

    Returns None.  Problems are reported on stdout and the affected entry
    is skipped.
    """
    pwd = f.pwd()
    if localdir and not os.path.isdir(localdir):
        if verbose:
            print('Creating local directory %r' % (localdir,))
        try:
            makedir(localdir)
        except OSError:
            print('Failed to establish local directory %r' % (localdir,))
            return
    infofilename = os.path.join(localdir, '.mirrorinfo')
    info = _load_mirrorinfo(infofilename)
    subdirs = []
    listing = []
    if verbose:
        print('Listing remote directory %r...' % (pwd,))
    f.retrlines('LIST', listing.append)
    filesfound = []
    for line in listing:
        if verbose > 1:
            print('--> %r' % (line,))
        parsed = _parse_listing_line(line)
        if parsed is None:
            continue
        filename, mode, infostuff, linkto = parsed
        pat = _skip_pattern_for(filename)
        if pat is not None:
            if verbose > 1:
                print('Skip pattern %r matches %r' % (pat, filename))
            continue
        if mode[0] == 'd':
            if verbose > 1:
                print('Remembering subdirectory %r' % (filename,))
            subdirs.append(filename)
            continue
        filesfound.append(filename)
        if filename in info and info[filename] == infostuff:
            if verbose > 1:
                print('Already have this version of %r' % (filename,))
            continue
        # NOTE(review): filename comes straight from the server's listing
        # and is joined unchecked; a hostile server could supply '../' --
        # confirm whether that matters for your deployment.
        fullname = os.path.join(localdir, filename)
        tempname = os.path.join(localdir, '@' + filename)
        if interactive:
            if not askabout('file', filename, pwd):
                # Keep a record entry so the local copy is not treated as
                # obsolete by the clean-up pass below.
                if filename not in info:
                    info[filename] = 'Not retrieved'
                continue
        try:
            os.unlink(tempname)
        except OSError:
            pass
        if mode[0] == 'l':
            if linkto is None:
                # No ' -> target' part in the listing line: there is
                # nothing to point the link at.
                print("Can't determine target of symbolic link %r"
                      % (filename,))
                continue
            if verbose:
                print('Creating symlink %r -> %r' % (filename, linkto))
            try:
                os.symlink(linkto, tempname)
            except (OSError, IOError) as msg:
                # os.symlink reports failures as OSError.
                print("Can't create %r: %s" % (tempname, msg))
                continue
        else:
            try:
                fp = open(tempname, 'wb')
            except IOError as msg:
                print("Can't create %r: %s" % (tempname, msg))
                continue
            if verbose:
                print('Retrieving %r from %r as %r...'
                      % (filename, pwd, fullname))
                fp1 = LoggingFile(fp, 1024, sys.stdout)
            else:
                fp1 = fp
            retrieved = True
            t0 = time.time()
            try:
                try:
                    f.retrbinary('RETR ' + filename, fp1.write, 8*1024)
                except ftplib.error_perm as msg:
                    print(msg)
                    retrieved = False
                t1 = time.time()
                nbytes = fp.tell()
            finally:
                fp.close()
                if fp1 is not fp:
                    fp1.close()
            if not retrieved:
                # The server refused the transfer: discard the partial temp
                # file instead of renaming it over a good local copy, and
                # do not record the file as up to date, so it is retried on
                # the next run.
                try:
                    os.unlink(tempname)
                except OSError:
                    pass
                if filename not in info:
                    info[filename] = 'Not retrieved'
                continue
        try:
            os.unlink(fullname)
        except OSError:
            pass            # Ignore the error
        try:
            os.rename(tempname, fullname)
        except OSError as msg:
            print("Can't rename %r to %r: %s" % (tempname, fullname, msg))
            continue
        info[filename] = infostuff
        writedict(info, infofilename)
        if verbose and mode[0] != 'l':
            dt = t1 - t0
            kbytes = nbytes / 1024.0
            summary = '%d Kbytes in %d seconds' % (int(round(kbytes)),
                                                   int(round(dt)))
            if t1 > t0:
                print('%s (~%d Kbytes/sec)'
                      % (summary, int(round(kbytes / dt))))
                # The original output has a blank line after the rate.
                print('')
            else:
                print(summary)
    #
    # Remove files from info that are no longer remote
    found = set(filesfound)
    deletions = 0
    for filename in list(info):     # copy: entries are deleted in the loop
        if filename not in found:
            if verbose:
                print('Removing obsolete info entry for %r in %r'
                      % (filename, localdir or '.'))
            del info[filename]
            deletions = deletions + 1
    if deletions:
        writedict(info, infofilename)
    #
    # Remove local files that are no longer in the remote directory
    try:
        names = os.listdir(localdir or os.curdir)
    except OSError:
        names = []
    for name in names:
        if name[0] == '.' or name in info or name in subdirs:
            continue
        pat = _skip_pattern_for(name)
        if pat is not None:
            if verbose > 1:
                print('Skip pattern %r matches %r' % (pat, name))
            continue
        fullname = os.path.join(localdir, name)
        if not rmok:
            if verbose:
                print('Local file %r is no longer pertinent' % (fullname,))
            continue
        if verbose:
            print('Removing local file/dir %r' % (fullname,))
        remove(fullname)
    #
    # Recursively mirror subdirectories
    for subdir in subdirs:
        if interactive:
            if not askabout('subdirectory', subdir, pwd):
                continue
        if verbose:
            print('Processing subdirectory %r' % (subdir,))
        localsubdir = os.path.join(localdir, subdir)
        pwd = f.pwd()
        if verbose > 1:
            print('Remote directory now: %r' % (pwd,))
            print('Remote cwd %r' % (subdir,))
        try:
            f.cwd(subdir)
        except ftplib.error_perm as msg:
            print("Can't chdir to %r : %r" % (subdir, msg))
        else:
            if verbose:
                print('Mirroring as %r' % (localsubdir,))
            mirrorsubdir(f, localsubdir)
            if verbose > 1:
                print('Remote cwd ..')
            f.cwd('..')
        # Make sure 'cd subdir' + 'cd ..' really brought us back; if not,
        # every later relative cwd would land in the wrong place.
        newpwd = f.pwd()
        if newpwd != pwd:
            print('Ended up in wrong directory after cd + cd ..')
            print('Giving up now.')
            break
        if verbose > 1:
            print('OK.')


# Read the per-directory record of already mirrored files.
def _load_mirrorinfo(infofilename):
    """Return the dictionary stored in *infofilename* ({} if unusable)."""
    try:
        with open(infofilename, 'r') as fp:
            text = fp.read()
    except IOError:
        text = '{}'
    # NOTE(review): eval() executes whatever the info file contains.  The
    # file is written by this script, but anyone who can write to the
    # mirror directory can run code here; ast.literal_eval would be a
    # safer reader for this format.
    try:
        info = eval(text)
    except (SyntaxError, NameError):
        info = None
    if not isinstance(info, dict):
        print('Bad mirror info in %r' % (infofilename,))
        info = {}
    return info


# Turn one line of LIST output into its interesting parts.
def _parse_listing_line(line):
    """Return (filename, mode, infostuff, linkto), or None to skip *line*.

    linkto is the text after ' -> ' in the name field, or None when the
    line has no such part.
    """
    if mac:
        # Mac listing has just filenames; trailing / means subdirectory
        filename = line.strip()
        if not filename:
            return None
        if filename[-1:] == '/':
            return filename[:-1], 'd', '', None
        return filename, '-', '', None
    # Parse, assuming a UNIX listing
    words = line.split(None, 8)
    if len(words) < 6:
        if verbose > 1:
            print('Skipping short line')
        return None
    filename = words[-1].lstrip()
    linkto = None
    i = filename.find(' -> ')
    if i >= 0:
        # words[0] had better start with 'l'...
        if verbose > 1:
            print('Found symbolic link %r' % (filename,))
        linkto = filename[i+4:]
        filename = filename[:i]
    return filename, words[0], words[-5:-1], linkto


# Look a name up in the global skip patterns.
def _skip_pattern_for(name):
    """Return the first pattern in skippats matching *name*, else None."""
    for pat in skippats:
        if fnmatch(name, pat):
            return pat
    return None
 | |
| 
 | |
| # Helper to remove a file or directory tree
 | |
def remove(fullname):
    """Remove a file, a symlink, or a whole directory tree.

    A symlink to a directory is unlinked, not followed.  Failures are
    reported on stdout; removal of the remaining siblings is still
    attempted.

    Returns:
        1 if *fullname* was removed completely, 0 otherwise.
    """
    if not os.path.isdir(fullname) or os.path.islink(fullname):
        try:
            os.unlink(fullname)
        except OSError as msg:
            print("Can't remove local file %r: %s" % (fullname, msg))
            return 0
        return 1

    try:
        names = os.listdir(fullname)
    except OSError:
        names = []
    ok = 1
    for name in names:
        # Keep going after a failure so as much as possible is cleaned up.
        if not remove(os.path.join(fullname, name)):
            ok = 0
    if not ok:
        return 0
    try:
        os.rmdir(fullname)
    except OSError as msg:
        print("Can't remove local directory %r: %s" % (fullname, msg))
        return 0
    return 1
 | |
| 
 | |
| # Wrapper around a file for writing to write a hash sign every block.
 | |
class LoggingFile:
    """Write-through wrapper that prints a '#' for every block written.

    Attributes:
        fp: the wrapped file object; receives every write unchanged.
        bytes: total number of bytes (len of the data) written so far.
        hashes: number of '#' marks already emitted.
        blocksize: number of bytes represented by one '#'.
        outfp: stream the progress marks are written to.
    """

    def __init__(self, fp, blocksize, outfp):
        self.fp = fp
        self.bytes = 0
        self.hashes = 0
        self.blocksize = blocksize
        self.outfp = outfp

    def write(self, data):
        """Pass *data* to the wrapped file, emitting any marks now due."""
        self.bytes = self.bytes + len(data)
        # Floor division: only completed blocks earn a mark.  A plain '/'
        # is true division on Python 3 and would emit one mark too many.
        due = self.bytes // self.blocksize
        if due > self.hashes:
            self.outfp.write('#' * (due - self.hashes))
            self.outfp.flush()
            self.hashes = due
        self.fp.write(data)

    def close(self):
        """Finish the progress line; the wrapped file is NOT closed."""
        self.outfp.write('\n')
 | |
| 
 | |
| # Ask permission to download a file.
 | |
def askabout(filetype, filename, pwd):
    """Ask the user whether to retrieve *filename*.

    Args:
        filetype: word used in the prompt ('file' or 'subdirectory').
        filename: remote name being asked about.
        pwd: remote directory shown in the prompt.

    Returns:
        1 for an answer of y/ye/yes, 0 for n/no/nop/nope or an empty
        reply.  Answers are case-insensitive; any other reply repeats the
        question.
    """
    prompt = 'Retrieve %s %s from %s ? [ny] ' % (filetype, filename, pwd)
    try:
        read_line = raw_input       # Python 2
    except NameError:
        read_line = input           # Python 3: input() returns the raw text
    while 1:
        reply = read_line(prompt).strip().lower()
        if reply in ('y', 'ye', 'yes'):
            return 1
        if reply in ('', 'n', 'no', 'nop', 'nope'):
            return 0
        print('Please answer yes or no.')
 | |
| 
 | |
| # Create a directory if it doesn't exist.  Recursively create the
 | |
| # parent directory as well if needed.
 | |
def makedir(pathname):
    """Create directory *pathname*, creating missing parents first.

    Does nothing when the directory already exists.  New directories are
    created with mode 0o777 (subject to the process umask).

    Raises:
        OSError: if a directory cannot be created.
    """
    if os.path.isdir(pathname):
        return
    dirname = os.path.dirname(pathname)
    # dirname == pathname happens for a root that does not exist (e.g. an
    # unknown drive); recursing on it would never terminate.
    if dirname and dirname != pathname:
        makedir(dirname)
    # With a trailing separator ('a/b/') the parent call above has already
    # created the directory itself, so check again before mkdir.
    if not os.path.isdir(pathname):
        os.mkdir(pathname, 0o777)
 | |
| 
 | |
| # Write a dictionary to a file in a way that can be read back using
 | |
| # eval() but is still somewhat readable (i.e. not a single long line).
 | |
| # Also creates a backup file.
 | |
def writedict(dict, filename):
    """Write *dict* to *filename* as a Python dict literal, one item a line.

    The text is first written to a temporary '@<name>' file in the same
    directory; any previous *filename* is kept as '<name>~' and the
    temporary file is then renamed into place.

    Args:
        dict: mapping to store; keys and values are written with repr().
        filename: path of the file to (re)write.

    Raises:
        IOError/OSError: if the temporary file cannot be written or the
            final rename fails.
    """
    dirname, fname = os.path.split(filename)
    tempname = os.path.join(dirname, '@' + fname)
    backup = os.path.join(dirname, fname + '~')
    with open(tempname, 'w') as fp:
        fp.write('{\n')
        for key, value in dict.items():
            fp.write('%r: %r,\n' % (key, value))
        fp.write('}\n')
    # Only touch the old backup once the new contents are safely on disk.
    try:
        os.unlink(backup)
    except OSError:
        pass
    try:
        os.rename(filename, backup)
    except OSError:
        pass                # no previous file to back up
    os.rename(tempname, filename)
 | |
| 
 | |
| 
 | |
# Run the mirror only when executed as a script, not when imported.
if __name__ == '__main__':
    main()
 | 
