PageRenderTime 387ms CodeModel.GetById 161ms app.highlight 118ms RepoModel.GetById 103ms app.codeStats 0ms

/Tools/scripts/ftpmirror.py

http://unladen-swallow.googlecode.com/
Python | 400 lines | 359 code | 5 blank | 36 comment | 14 complexity | 79dd1fea53d3d4ad26737608f4862572 MD5 | raw file
  1#! /usr/bin/env python
  2
"""Mirror a remote ftp subtree into a local directory tree.

usage: ftpmirror [-v] [-q] [-i] [-m] [-n] [-r] [-s pat]
                 [-l username [-p passwd [-a account]]]
                 hostname[:port] [remotedir [localdir]]
-v: verbose
-q: quiet
-i: interactive mode
-m: macintosh server (NCSA telnet 2.4) (implies -n -s '*.o')
-n: don't log in
-r: remove local files/directories no longer pertinent
-l username [-p passwd [-a account]]: login info (default .netrc or anonymous)
-s pat: skip files matching pattern
hostname: remote host w/ optional port separated by ':'
remotedir: remote directory (default initial)
localdir: local directory (default current)
"""
 20
 21import os
 22import sys
 23import time
 24import getopt
 25import ftplib
 26import netrc
 27from fnmatch import fnmatch
 28
 # Print usage message and exit
def usage(*args):
    """Write the given messages and the module usage text to stderr, then exit.

    Each positional argument is written on its own line (converted with
    str()), followed by the module docstring.  The function never returns:
    it always ends with sys.exit(2).
    """
    # Write to sys.stderr directly rather than rebinding sys.stdout, so a
    # caller that traps SystemExit is not left with stdout redirected.
    for msg in args:
        sys.stderr.write('%s\n' % (msg,))
    sys.stderr.write('%s\n' % (__doc__,))
    sys.exit(2)
 35
 # Option state set by main() from the command line and read by mirrorsubdir().
verbose = 1  # 0 for -q, 2 for -v
interactive = 0  # -i: ask before retrieving each file / entering each subdirectory
mac = 0  # -m: parse listings as bare filenames (trailing '/' marks a directory)
rmok = 0  # -r: actually remove local files that are no longer pertinent
nologin = 0  # -n (or -m): do not log in after connecting
skippats = ['.', '..', '.mirrorinfo']  # fnmatch patterns for names to ignore
 42
 # Main program: parse command line and start processing
def main():
    """Parse the command line, connect to the FTP host and mirror it.

    Options and positional arguments (hostname[:port], optional remotedir,
    optional localdir) are taken from sys.argv.  The module-level option
    flags are updated from the options, and mirrorsubdir() is then run on
    the selected remote directory.  Login defaults come from the user's
    netrc entry for the host, if any; -l/-p/-a override them.

    Usage errors (bad option, missing hostname, bad port, too many
    arguments) are reported through usage(), which exits with status 2.
    """
    global verbose, interactive, mac, rmok, nologin
    try:
        # 'b' is accepted by the option string but nothing below acts on it.
        opts, args = getopt.getopt(sys.argv[1:], 'a:bil:mnp:qrs:v')
    except getopt.error as msg:
        usage(msg)
    if not args:
        usage('hostname missing')
    if len(args) > 3:
        usage('too many arguments')

    host = args[0]
    port = 0
    if ':' in host:
        host, port = host.split(':', 1)
        try:
            port = int(port)
        except ValueError:
            # Report a malformed port as a usage error, not a traceback.
            usage('bad port number %r' % (port,))

    # Login defaults from netrc; a missing or unparsable file is not an error.
    login = passwd = account = ''
    try:
        auth = netrc.netrc().authenticators(host)
    except (netrc.NetrcParseError, IOError):
        auth = None
    if auth is not None:
        # netrc may report a field the entry does not give as None;
        # ftplib expects strings, so normalise those to ''.
        login, account, passwd = [field or '' for field in auth]

    for o, a in opts:
        if o == '-l':
            login = a
        elif o == '-p':
            passwd = a
        elif o == '-a':
            account = a
        elif o == '-v':
            verbose = verbose + 1
        elif o == '-q':
            verbose = 0
        elif o == '-i':
            interactive = 1
        elif o == '-m':
            mac = 1
            nologin = 1
            skippats.append('*.o')
        elif o == '-n':
            nologin = 1
        elif o == '-r':
            rmok = 1
        elif o == '-s':
            skippats.append(a)

    remotedir = args[1] if args[1:] else ''
    localdir = args[2] if args[2:] else ''

    f = ftplib.FTP()
    if verbose:
        print("Connecting to '%s%s'..." % (host,
                                           (":%d" % port) if port else ""))
    f.connect(host, port)
    try:
        if not nologin:
            if verbose:
                print('Logging in as %r...' % (login or 'anonymous'))
            f.login(login, passwd, account)
        if verbose:
            print('OK.')
        pwd = f.pwd()
        if verbose > 1:
            print('PWD = %r' % (pwd,))
        if remotedir:
            if verbose > 1:
                print('cwd(%s)' % repr(remotedir))
            f.cwd(remotedir)
            if verbose > 1:
                print('OK.')
            pwd = f.pwd()
            if verbose > 1:
                print('PWD = %r' % (pwd,))
        mirrorsubdir(f, localdir)
    finally:
        # Release the control connection even if mirroring fails part-way.
        f.close()
103
# Core logic: mirror one subdirectory (recursively)
def mirrorsubdir(f, localdir):
    """Mirror the server's current directory into localdir, recursively.

    f is a connected ftplib.FTP object positioned in the remote directory
    to mirror; localdir is the local target directory ('' means the
    current directory) and is created if needed.

    For every listed file whose listing details differ from those recorded
    in localdir/.mirrorinfo, the file is fetched into a temporary
    '@name' file and renamed into place, and the record is updated.
    Records for files no longer listed are dropped.  Local names that are
    neither recorded nor remote subdirectories are reported, or removed
    when the rmok flag is set.  Finally each remote subdirectory is
    mirrored by a recursive call.

    Returns None.  Problems with individual files are printed and skipped.
    """
    pwd = f.pwd()
    if localdir and not os.path.isdir(localdir):
        if verbose:
            print('Creating local directory %r' % (localdir,))
        try:
            makedir(localdir)
        except os.error:
            print('Failed to establish local directory %r' % (localdir,))
            return
    infofilename = os.path.join(localdir, '.mirrorinfo')
    info = _load_mirrorinfo(infofilename)

    subdirs = []
    listing = []
    if verbose:
        print('Listing remote directory %r...' % (pwd,))
    f.retrlines('LIST', listing.append)
    filesfound = set()
    for line in listing:
        if verbose > 1:
            print('--> %r' % (line,))
        entry = _parse_listing_line(line)
        if entry is None:
            if verbose > 1:
                print('Skipping short line')
            continue
        filename, mode, infostuff, linkto = entry
        if linkto is not None and verbose > 1:
            print('Found symbolic link %r' % ('%s -> %s' % (filename, linkto),))
        pat = _matching_skip_pattern(filename)
        if pat is not None:
            if verbose > 1:
                print('Skip pattern %r matches %r' % (pat, filename))
            continue
        # The listing comes from the remote server: refuse empty names and
        # names with a path component, which would land outside localdir.
        if not filename or os.path.basename(filename) != filename:
            print('Skipping unsafe remote name %r' % (filename,))
            continue
        if mode[0] == 'd':
            if verbose > 1:
                print('Remembering subdirectory %r' % (filename,))
            subdirs.append(filename)
            continue
        filesfound.add(filename)
        if filename in info and info[filename] == infostuff:
            if verbose > 1:
                print('Already have this version of %r' % (filename,))
            continue
        fullname = os.path.join(localdir, filename)
        tempname = os.path.join(localdir, '@' + filename)
        if interactive:
            if not askabout('file', filename, pwd):
                if filename not in info:
                    info[filename] = 'Not retrieved'
                continue
        try:
            os.unlink(tempname)
        except os.error:
            pass  # no stale temporary file to clear
        # Only treat the entry as a link when a target was actually parsed;
        # otherwise fall through and fetch it like a regular file.
        is_link = mode[0] == 'l' and linkto is not None
        if is_link:
            if verbose:
                print("Creating symlink %r -> %r" % (filename, linkto))
            try:
                os.symlink(linkto, tempname)
            except (IOError, OSError) as msg:
                print("Can't create %r: %s" % (tempname, msg))
                continue
        else:
            try:
                fp = open(tempname, 'wb')
            except IOError as msg:
                print("Can't create %r: %s" % (tempname, msg))
                continue
            if verbose:
                print('Retrieving %r from %r as %r...' % (filename, pwd, fullname))
                fp1 = LoggingFile(fp, 1024, sys.stdout)
            else:
                fp1 = fp
            failed = False
            t0 = time.time()
            try:
                f.retrbinary('RETR ' + filename,
                             fp1.write, 8*1024)
            except ftplib.error_perm as msg:
                print(msg)
                failed = True
            finally:
                t1 = time.time()
                nbytes = fp.tell()
                fp.close()
                if fp1 is not fp:
                    fp1.close()
            if failed:
                # Do not install or record a file the server refused to
                # send; drop the partial download so it is retried later.
                try:
                    os.unlink(tempname)
                except os.error:
                    pass
                continue
        try:
            os.unlink(fullname)
        except os.error:
            pass            # Ignore the error
        try:
            os.rename(tempname, fullname)
        except os.error as msg:
            print("Can't rename %r to %r: %s" % (tempname, fullname, msg))
            continue
        info[filename] = infostuff
        writedict(info, infofilename)
        if verbose and not is_link:
            dt = t1 - t0
            kbytes = nbytes / 1024.0
            summary = '%d Kbytes in %d seconds' % (int(round(kbytes)),
                                                   int(round(dt)))
            if t1 > t0:
                summary += ' (~%d Kbytes/sec)' % int(round(kbytes / dt))
            print(summary)
    #
    # Remove files from info that are no longer remote
    deletions = 0
    for filename in list(info):  # copy: entries are deleted while looping
        if filename not in filesfound:
            if verbose:
                print('Removing obsolete info entry for %r in %r'
                      % (filename, localdir or '.'))
            del info[filename]
            deletions = deletions + 1
    if deletions:
        writedict(info, infofilename)
    #
    # Remove local files that are no longer in the remote directory
    try:
        names = os.listdir(localdir or os.curdir)
    except os.error:
        names = []
    for name in names:
        if name[0] == '.' or name in info or name in subdirs:
            continue
        pat = _matching_skip_pattern(name)
        if pat is not None:
            if verbose > 1:
                print('Skip pattern %r matches %r' % (pat, name))
            continue
        fullname = os.path.join(localdir, name)
        if not rmok:
            if verbose:
                print('Local file %r is no longer pertinent' % (fullname,))
            continue
        if verbose:
            print('Removing local file/dir %r' % (fullname,))
        remove(fullname)
    #
    # Recursively mirror subdirectories
    for subdir in subdirs:
        if interactive:
            if not askabout('subdirectory', subdir, pwd):
                continue
        if verbose:
            print('Processing subdirectory %r' % (subdir,))
        localsubdir = os.path.join(localdir, subdir)
        pwd = f.pwd()
        if verbose > 1:
            print('Remote directory now: %r' % (pwd,))
            print('Remote cwd %r' % (subdir,))
        try:
            f.cwd(subdir)
        except ftplib.error_perm as msg:
            print("Can't chdir to %r : %r" % (subdir, msg))
        else:
            if verbose:
                print('Mirroring as %r' % (localsubdir,))
            mirrorsubdir(f, localsubdir)
            if verbose > 1:
                print('Remote cwd ..')
            f.cwd('..')
        # Sanity check: cd subdir + cd .. must bring us back where we were.
        newpwd = f.pwd()
        if newpwd != pwd:
            print('Ended up in wrong directory after cd + cd ..')
            print('Giving up now.')
            break
        else:
            if verbose > 1:
                print('OK.')


# Read the per-directory record of what has already been mirrored.
def _load_mirrorinfo(infofilename):
    """Return the dict stored in infofilename; {} if missing or unusable."""
    try:
        with open(infofilename, 'r') as fp:
            text = fp.read()
    except IOError:
        return {}
    try:
        # NOTE(review): eval() executes whatever the file contains.  The
        # file is normally written by writedict(), but anyone able to edit
        # it can run code here; consider ast.literal_eval instead.
        info = eval(text)
    except (SyntaxError, NameError):
        info = None
    if not isinstance(info, dict):
        print('Bad mirror info in %r' % (infofilename,))
        return {}
    return info


# Split one line of the remote listing into its interesting parts.
def _parse_listing_line(line):
    """Return (filename, mode, infostuff, linkto) for one LIST line.

    Returns None for a UNIX-style line with fewer than six fields.
    linkto is the link target for 'l' entries written as 'name -> target',
    otherwise None.  In mac mode the line is just a name, with a trailing
    '/' marking a subdirectory, and infostuff is ''.
    """
    if mac:
        filename = line.strip()
        mode = '-'
        if filename[-1:] == '/':
            filename = filename[:-1]
            mode = 'd'
        return filename, mode, '', None
    # Parse, assuming a UNIX listing
    words = line.split(None, 8)
    if len(words) < 6:
        return None
    mode = words[0]
    filename = words[-1].lstrip()
    linkto = None
    if mode[:1] == 'l':
        # Only link entries carry ' -> target'; a regular file whose name
        # happens to contain ' -> ' must not be truncated.
        i = filename.find(" -> ")
        if i >= 0:
            linkto = filename[i+4:]
            filename = filename[:i]
    return filename, mode, words[-5:-1], linkto


# Check a name against the configured skip patterns.
def _matching_skip_pattern(name):
    """Return the first pattern in skippats that matches name, else None."""
    for pat in skippats:
        if fnmatch(name, pat):
            return pat
    return None
309
# Helper to remove a file or directory tree
def remove(fullname):
    """Remove a file, or a directory together with everything below it.

    A symbolic link is unlinked itself, never followed.  Returns 1 when
    fullname was removed and 0 otherwise; each failure is reported with a
    printed message rather than an exception.
    """
    if os.path.isdir(fullname) and not os.path.islink(fullname):
        try:
            names = os.listdir(fullname)
        except os.error:
            names = []
        # Build a list (not a generator) so every child is attempted even
        # after an earlier one has failed.
        results = [remove(os.path.join(fullname, name)) for name in names]
        if not all(results):
            return 0
        try:
            os.rmdir(fullname)
        except os.error as msg:
            print("Can't remove local directory %r: %s" % (fullname, msg))
            return 0
    else:
        try:
            os.unlink(fullname)
        except os.error as msg:
            print("Can't remove local file %r: %s" % (fullname, msg))
            return 0
    return 1
335
# Wrapper around a file for writing to write a hash sign every block.
class LoggingFile:
    """Pass writes through to fp, printing one '#' on outfp per full block.

    fp is the file being written, blocksize the number of bytes each '#'
    stands for, and outfp the stream that receives the progress marks.
    """

    def __init__(self, fp, blocksize, outfp):
        self.fp = fp
        self.bytes = 0          # total number of bytes written so far
        self.hashes = 0         # number of '#' marks already printed
        self.blocksize = blocksize
        self.outfp = outfp

    def write(self, data):
        """Write data to the wrapped file and print any newly earned marks."""
        self.bytes = self.bytes + len(data)
        # Floor division: the count of complete blocks must stay an integer
        # on Python 3 as well.
        hashes = self.bytes // self.blocksize
        while hashes > self.hashes:
            self.outfp.write('#')
            self.outfp.flush()
            self.hashes = self.hashes + 1
        self.fp.write(data)

    def close(self):
        """End the progress line.  The wrapped file itself is not closed."""
        self.outfp.write('\n')
354
# Ask permission to download a file.
def askabout(filetype, filename, pwd):
    """Ask the user whether to retrieve an item; return 1 for yes, 0 for no.

    filetype, filename and pwd are only used to build the prompt.  An
    empty reply counts as "no"; any reply that is not a recognised yes/no
    word is rejected and the question is asked again.  End of input is
    treated as "no".
    """
    try:
        read_line = raw_input   # Python 2
    except NameError:
        read_line = input       # Python 3
    prompt = 'Retrieve %s %s from %s ? [ny] ' % (filetype, filename, pwd)
    while 1:
        try:
            reply = read_line(prompt).strip().lower()
        except EOFError:
            # No more answers can arrive; decline rather than crash.
            return 0
        if reply in ('y', 'ye', 'yes'):
            return 1
        if reply in ('', 'n', 'no', 'nop', 'nope'):
            return 0
        print('Please answer yes or no.')
365
# Create a directory if it doesn't exist.  Recursively create the
# parent directory as well if needed.
def makedir(pathname):
    """Create directory pathname, and any missing parents, with mode 0777.

    Does nothing if pathname is already a directory.  Errors from
    os.mkdir() propagate to the caller.
    """
    if os.path.isdir(pathname):
        return
    dirname = os.path.dirname(pathname)
    if dirname:
        makedir(dirname)
    # For a path with a trailing separator the recursive call has already
    # created the directory itself; calling mkdir again would fail.
    if not os.path.isdir(pathname):
        os.mkdir(pathname, 0o777)
374
# Write a dictionary to a file in a way that can be read back using
# eval() but is still somewhat readable (i.e. not a single long line).
# Also creates a backup file.
def writedict(dict, filename):
    """Write dict to filename as a dict literal, one 'key: value,' per line.

    The text is first written to a temporary '@name' file in the same
    directory.  Any existing filename is then renamed to 'name~' (after
    removing an older backup) and the temporary file is renamed into
    place.  Entries are written in a stable order (sorted by the repr of
    the key) so successive versions of the file are easy to compare.
    """
    dirname, fname = os.path.split(filename)
    tempname = os.path.join(dirname, '@' + fname)
    backup = os.path.join(dirname, fname + '~')
    try:
        os.unlink(backup)
    except os.error:
        pass  # no previous backup
    # 'with' closes the file even if a write fails part-way.
    with open(tempname, 'w') as fp:
        fp.write('{\n')
        for key in sorted(dict, key=repr):
            fp.write('%r: %r,\n' % (key, dict[key]))
        fp.write('}\n')
    try:
        os.rename(filename, backup)
    except os.error:
        pass  # nothing to back up yet
    os.rename(tempname, filename)
397
398
# Run the mirror only when executed as a script, not when imported.
if __name__ == '__main__':
    main()