406 lines
13 KiB
Python
Executable File
406 lines
13 KiB
Python
Executable File
#! /usr/bin/env python3
|
|
|
|
"""Mirror a remote ftp subtree into a local directory tree.
|
|
|
|
usage: ftpmirror [-v] [-q] [-i] [-m] [-n] [-r] [-s pat]
|
|
[-l username [-p passwd [-a account]]]
|
|
hostname[:port] [remotedir [localdir]]
|
|
-v: verbose
|
|
-q: quiet
|
|
-i: interactive mode
|
|
-m: macintosh server (NCSA telnet 2.4) (implies -n -s '*.o')
|
|
-n: don't log in
|
|
-r: remove local files/directories no longer pertinent
|
|
-l username [-p passwd [-a account]]: login info (default .netrc or anonymous)
|
|
-s pat: skip files matching pattern
|
|
hostname: remote host w/ optional port separated by ':'
|
|
remotedir: remote directory (default initial)
|
|
localdir: local directory (default current)
|
|
"""
|
|
|
|
import os
|
|
import sys
|
|
import time
|
|
import getopt
|
|
import ftplib
|
|
import netrc
|
|
from fnmatch import fnmatch
|
|
|
|
# Print usage message and exit
|
|
def usage(*args):
    """Print error messages and the usage text to stderr, then exit.

    Each positional argument is printed on its own line, followed by the
    module docstring (``__doc__``).  The process then exits with status 2.

    Output is sent to ``sys.stderr`` explicitly rather than by rebinding
    ``sys.stdout``, so a caller that catches ``SystemExit`` does not find
    its standard output permanently redirected.
    """
    for msg in args:
        print(msg, file=sys.stderr)
    print(__doc__, file=sys.stderr)
    sys.exit(2)
|
|
|
|
# Module-wide settings; main() rebinds the flags from the command line.
verbose = 1             # 0 for -q, 2 for -v
# Boolean switches, all off by default (-i, -m, -r and -n respectively).
interactive = mac = rmok = nologin = 0
# fnmatch patterns for names that are never mirrored; -s and -m append here.
skippats = ['.', '..', '.mirrorinfo']
|
|
|
|
# Main program: parse command line and start processing
|
|
def main():
    """Parse the command line, connect to the FTP server and start mirroring.

    Reads ``sys.argv``; see the module docstring for the accepted options.
    Login data is taken from ``~/.netrc`` when an entry for the host exists
    and may be overridden with -l / -p / -a.  Command-line mistakes are
    reported through ``usage()``, which terminates the process.

    Rebinds the module-level flags ``verbose``, ``interactive``, ``mac``,
    ``rmok`` and ``nologin`` and appends to ``skippats``.
    """
    global verbose, interactive, mac, rmok, nologin
    try:
        # NOTE: 'b' is accepted by getopt but no branch below acts on it.
        opts, args = getopt.getopt(sys.argv[1:], 'a:bil:mnp:qrs:v')
    except getopt.error as msg:
        usage(msg)
    login = ''
    passwd = ''
    account = ''
    if not args:
        usage('hostname missing')
    host = args[0]
    port = 0
    if ':' in host:
        host, port = host.split(':', 1)
        try:
            port = int(port)
        except ValueError:
            # Report a malformed port as a usage error, not a traceback.
            usage('invalid port number: %r' % (port,))
    try:
        auth = netrc.netrc().authenticators(host)
    except (netrc.NetrcParseError, OSError):
        # A missing or unreadable ~/.netrc simply means "no stored login".
        auth = None
    if auth is not None:
        # authenticators() yields (login, account, password); a field that
        # is absent from the file may be None, which FTP.login cannot send.
        login, account, passwd = (field or '' for field in auth)
    for o, a in opts:
        if o == '-l':
            login = a
        elif o == '-p':
            passwd = a
        elif o == '-a':
            account = a
        elif o == '-v':
            verbose = verbose + 1
        elif o == '-q':
            verbose = 0
        elif o == '-i':
            interactive = 1
        elif o == '-m':
            mac = 1
            nologin = 1
            skippats.append('*.o')
        elif o == '-n':
            nologin = 1
        elif o == '-r':
            rmok = 1
        elif o == '-s':
            skippats.append(a)
    remotedir = ''
    localdir = ''
    if args[1:]:
        remotedir = args[1]
        if args[2:]:
            localdir = args[2]
            if args[3:]:
                usage('too many arguments')
    #
    # The context manager makes sure the control connection is shut down
    # (QUIT, then close) even when mirroring stops with an exception.
    with ftplib.FTP() as f:
        if verbose:
            portsuffix = ":%d" % port if port else ""
            print("Connecting to '%s%s'..." % (host, portsuffix))
        f.connect(host, port)
        if not nologin:
            if verbose:
                print('Logging in as %r...' % (login or 'anonymous'))
            f.login(login, passwd, account)
        if verbose:
            print('OK.')
        pwd = f.pwd()
        if verbose > 1:
            print('PWD =', repr(pwd))
        if remotedir:
            if verbose > 1:
                print('cwd(%s)' % repr(remotedir))
            f.cwd(remotedir)
            if verbose > 1:
                print('OK.')
            pwd = f.pwd()
            if verbose > 1:
                print('PWD =', repr(pwd))
        #
        mirrorsubdir(f, localdir)
|
|
|
|
# Core logic: mirror one subdirectory (recursively)
|
|
def mirrorsubdir(f, localdir):
    """Mirror the server's current directory into *localdir*, recursively.

    f        -- a connected ftplib.FTP object positioned in the directory
                to mirror.
    localdir -- local destination directory; '' means the current directory.

    Steps, in order:
      1. create *localdir* if needed and load its '.mirrorinfo' dictionary;
      2. LIST the remote directory, then download every file (or recreate
         every symlink) whose listing data differs from the recorded entry;
      3. drop info entries for files that disappeared remotely;
      4. report, or with -r remove, local files unknown to the mirror;
      5. recurse into each remote subdirectory.

    Downloads go to a temporary '@name' file which is renamed over the
    final name afterwards.  Most problems are reported with print() and
    the affected item is skipped.
    """
    pwd = f.pwd()
    if localdir and not os.path.isdir(localdir):
        if verbose:
            print('Creating local directory', repr(localdir))
        try:
            makedir(localdir)
        except OSError:
            print("Failed to establish local directory", repr(localdir))
            return
    infofilename = os.path.join(localdir, '.mirrorinfo')
    info = _read_mirror_info(infofilename)
    subdirs = []
    listing = []
    if verbose:
        print('Listing remote directory %r...' % (pwd,))
    f.retrlines('LIST', listing.append)
    # A set gives constant-time membership tests in the cleanup pass below.
    filesfound = set()
    for line in listing:
        if verbose > 1:
            print('-->', repr(line))
        parsed = _parse_listing_line(line)
        if parsed is None:
            continue
        filename, mode, infostuff, linkto = parsed
        if _should_skip(filename):
            continue
        if mode[0] == 'd':
            if verbose > 1:
                print('Remembering subdirectory', repr(filename))
            subdirs.append(filename)
            continue
        filesfound.add(filename)
        if filename in info and info[filename] == infostuff:
            if verbose > 1:
                print('Already have this version of', repr(filename))
            continue
        if mode[0] == 'l' and linkto is None:
            # The listing marks this entry as a link but shows no
            # " -> target" part, so there is nothing to point the link at.
            print("Can't determine target of symbolic link %r" % (filename,))
            if filename not in info:
                info[filename] = 'Not retrieved'
            continue
        fullname = os.path.join(localdir, filename)
        tempname = os.path.join(localdir, '@'+filename)
        if interactive:
            doit = askabout('file', filename, pwd)
            if not doit:
                if filename not in info:
                    info[filename] = 'Not retrieved'
                continue
        # Get rid of a temporary file left behind by an earlier run.
        try:
            os.unlink(tempname)
        except OSError:
            pass
        if mode[0] == 'l':
            if verbose:
                print("Creating symlink %r -> %r" % (filename, linkto))
            try:
                os.symlink(linkto, tempname)
            except OSError as msg:
                print("Can't create %r: %s" % (tempname, msg))
                continue
        else:
            try:
                fp = open(tempname, 'wb')
            except OSError as msg:
                print("Can't create %r: %s" % (tempname, msg))
                continue
            if verbose:
                print('Retrieving %r from %r as %r...' %
                      (filename, pwd, fullname))
                sink = LoggingFile(fp, 1024, sys.stdout)
            else:
                sink = fp
            t0 = time.time()
            try:
                try:
                    f.retrbinary('RETR ' + filename, sink.write, 8*1024)
                except ftplib.error_perm as msg:
                    # NOTE: only reported; whatever was written so far is
                    # still renamed into place and recorded below.
                    print(msg)
                t1 = time.time()
                nbytes = fp.tell()
            finally:
                # Close the file even if the transfer fails unexpectedly.
                fp.close()
            if sink is not fp:
                sink.close()
        try:
            os.unlink(fullname)
        except OSError:
            pass                # Ignore the error
        try:
            os.rename(tempname, fullname)
        except OSError as msg:
            print("Can't rename %r to %r: %s" % (tempname, fullname, msg))
            continue
        info[filename] = infostuff
        writedict(info, infofilename)
        if verbose and mode[0] != 'l':
            dt = t1 - t0
            kbytes = nbytes / 1024.0
            print(int(round(kbytes)), end=' ')
            print('Kbytes in', end=' ')
            print(int(round(dt)), end=' ')
            print('seconds', end=' ')
            if t1 > t0:
                print('(~%d Kbytes/sec)' % int(round(kbytes/dt)))
            print()
    #
    # Remove files from info that are no longer remote
    deletions = 0
    for filename in list(info.keys()):
        if filename not in filesfound:
            if verbose:
                print("Removing obsolete info entry for", end=' ')
                print(repr(filename), "in", repr(localdir or "."))
            del info[filename]
            deletions = deletions + 1
    if deletions:
        writedict(info, infofilename)
    #
    # Remove local files that are no longer in the remote directory
    try:
        names = os.listdir(localdir or os.curdir)
    except OSError:
        names = []
    for name in names:
        if name[0] == '.' or name in info or name in subdirs:
            continue
        if _should_skip(name):
            continue
        fullname = os.path.join(localdir, name)
        if not rmok:
            if verbose:
                print('Local file', repr(fullname), end=' ')
                print('is no longer pertinent')
            continue
        if verbose:
            print('Removing local file/dir', repr(fullname))
        remove(fullname)
    #
    # Recursively mirror subdirectories
    for subdir in subdirs:
        if interactive:
            doit = askabout('subdirectory', subdir, pwd)
            if not doit:
                continue
        if verbose:
            print('Processing subdirectory', repr(subdir))
        localsubdir = os.path.join(localdir, subdir)
        pwd = f.pwd()
        if verbose > 1:
            print('Remote directory now:', repr(pwd))
            print('Remote cwd', repr(subdir))
        try:
            f.cwd(subdir)
        except ftplib.error_perm as msg:
            print("Can't chdir to", repr(subdir), ":", repr(msg))
        else:
            if verbose:
                print('Mirroring as', repr(localsubdir))
            mirrorsubdir(f, localsubdir)
            if verbose > 1:
                print('Remote cwd ..')
            f.cwd('..')
        # Guard against servers where "cd x" + "cd .." does not lead back.
        newpwd = f.pwd()
        if newpwd != pwd:
            print('Ended up in wrong directory after cd + cd ..')
            print('Giving up now.')
            break
        else:
            if verbose > 1:
                print('OK.')


def _read_mirror_info(infofilename):
    """Load the info dictionary stored in *infofilename* ({} if unusable)."""
    try:
        with open(infofilename, 'r') as fp:
            text = fp.read()
    except OSError:
        text = '{}'
    try:
        # NOTE(security): eval() executes whatever expression the file
        # contains.  The file is normally produced by writedict(), but a
        # tampered .mirrorinfo would run arbitrary code here.
        info = eval(text)
    except (SyntaxError, NameError):
        print('Bad mirror info in', repr(infofilename))
        return {}
    if not isinstance(info, dict):
        # Valid expression, but not the mapping the mirror logic expects.
        print('Bad mirror info in', repr(infofilename))
        return {}
    return info


def _parse_listing_line(line):
    """Split one LIST line into (filename, mode, infostuff, linkto).

    Returns None for a line too short to be a UNIX-style entry.  *linkto*
    is None unless the name part contains " -> target".
    """
    if mac:
        # Mac listing has just filenames;
        # trailing / means subdirectory
        filename = line.strip()
        mode = '-'
        if filename[-1:] == '/':
            filename = filename[:-1]
            mode = 'd'
        return filename, mode, '', None
    # Parse, assuming a UNIX listing
    words = line.split(None, 8)
    if len(words) < 6:
        if verbose > 1:
            print('Skipping short line')
        return None
    filename = words[-1].lstrip()
    linkto = None
    i = filename.find(" -> ")
    if i >= 0:
        # words[0] had better start with 'l'...
        if verbose > 1:
            print('Found symbolic link %r' % (filename,))
        linkto = filename[i+4:]
        filename = filename[:i]
    return filename, words[0], words[-5:-1], linkto


def _should_skip(name):
    """Return True if *name* matches one of the patterns in skippats."""
    for pat in skippats:
        if fnmatch(name, pat):
            if verbose > 1:
                print('Skip pattern', repr(pat), end=' ')
                print('matches', repr(name))
            return True
    return False
|
|
|
|
# Helper to remove a file or directory tree
|
|
def remove(fullname):
    """Delete a file, a symlink or a whole directory tree.

    Returns 1 on success and 0 if anything could not be removed; failures
    are reported with print() instead of being raised.  A symlink that
    points at a directory is unlinked, not followed.
    """
    is_real_dir = os.path.isdir(fullname) and not os.path.islink(fullname)
    if not is_real_dir:
        try:
            os.unlink(fullname)
        except OSError as msg:
            print("Can't remove local file %r: %s" % (fullname, msg))
            return 0
        return 1

    try:
        entries = os.listdir(fullname)
    except OSError:
        entries = []
    # Build the full list first so that every child is attempted even
    # after one of them has failed.
    outcomes = [remove(os.path.join(fullname, entry)) for entry in entries]
    if not all(outcomes):
        return 0
    try:
        os.rmdir(fullname)
    except OSError as msg:
        print("Can't remove local directory %r: %s" % (fullname, msg))
        return 0
    return 1
|
|
|
|
# Wrapper around a file for writing to write a hash sign every block.
|
|
class LoggingFile:
    """Write-only file wrapper that prints a '#' for every full block.

    fp        -- underlying file object receiving the data
    blocksize -- number of bytes represented by one hash mark
    outfp     -- text stream the hash marks are written to
    """

    def __init__(self, fp, blocksize, outfp):
        self.fp = fp
        self.bytes = 0          # total number of bytes written so far
        self.hashes = 0         # number of hash marks already printed
        self.blocksize = blocksize
        self.outfp = outfp

    def write(self, data):
        """Pass *data* to the wrapped file, printing any hash marks due."""
        self.bytes = self.bytes + len(data)
        # Floor division: only completed blocks earn a hash mark.  True
        # division would print one as soon as the first byte arrives.
        hashes = self.bytes // self.blocksize
        while hashes > self.hashes:
            self.outfp.write('#')
            self.outfp.flush()
            self.hashes = self.hashes + 1
        self.fp.write(data)

    def close(self):
        """End the progress line; the wrapped file is left open."""
        self.outfp.write('\n')
|
|
|
|
def raw_input(prompt):
    """Show *prompt* on stdout and return the next line read from stdin.

    The returned line keeps its trailing newline; at end of file the
    result is the empty string.
    """
    out = sys.stdout
    out.write(prompt)
    out.flush()     # make sure the prompt is visible before blocking
    line = sys.stdin.readline()
    return line
|
|
|
|
# Ask permission to download a file.
|
|
def askabout(filetype, filename, pwd):
    """Ask the user whether an item should be retrieved.

    filetype -- word used in the prompt ('file' or 'subdirectory')
    filename -- name of the remote item
    pwd      -- remote directory shown in the prompt

    Returns 1 for a yes answer and 0 for a no answer; an empty reply
    counts as no.  Any other reply makes the question repeat.
    """
    affirmative = ('y', 'ye', 'yes')
    negative = ('', 'n', 'no', 'nop', 'nope')
    prompt = 'Retrieve %s %s from %s ? [ny] ' % (filetype, filename, pwd)
    while True:
        answer = raw_input(prompt).strip().lower()
        if answer in affirmative:
            return 1
        if answer in negative:
            return 0
        print('Please answer yes or no.')
|
|
|
|
# Create a directory if it doesn't exist. Recursively create the
|
|
# parent directory as well if needed.
|
|
def makedir(pathname):
    """Create directory *pathname* together with any missing parents.

    Does nothing if the directory already exists.  Raises OSError when
    the directory cannot be created, for example because a regular file
    with that name is in the way.

    os.makedirs() is used so that a path ending in a separator ('a/b/')
    works: creating the parent first and then calling os.mkdir() on the
    original spelling fails because the directory already exists.
    """
    os.makedirs(pathname, 0o777, exist_ok=True)
|
|
|
|
# Write a dictionary to a file in a way that can be read back using
|
|
# eval() but is still somewhat readable (i.e. not a single long line).
|
|
# Also creates a backup file.
|
|
def writedict(dict, filename):
    """Save *dict* to *filename* as a Python dict literal, one item per line.

    The data is first written to a temporary '@name' file in the same
    directory.  The previous *filename*, if any, is then renamed to
    'name~' (replacing an older backup) and the temporary file is renamed
    into place.

    Raises OSError if the temporary file cannot be written or renamed.
    """
    dirname, fname = os.path.split(filename)
    tempname = os.path.join(dirname, '@' + fname)
    backup = os.path.join(dirname, fname + '~')
    # Remove the old backup up front so the rename below cannot collide
    # with it.
    try:
        os.unlink(backup)
    except OSError:
        pass
    # The with-block closes the file even when a write fails part-way.
    with open(tempname, 'w') as fp:
        fp.write('{\n')
        for key, value in dict.items():
            fp.write('%r: %r,\n' % (key, value))
        fp.write('}\n')
    try:
        os.rename(filename, backup)
    except OSError:
        pass        # no previous file to back up
    os.rename(tempname, filename)
|
|
|
|
|
|
# Run the mirror only when this file is executed as a script; importing it
# as a module just defines the functions above.
if __name__ == '__main__':
    main()
|