PageRenderTime 125ms CodeModel.GetById 61ms app.highlight 23ms RepoModel.GetById 37ms app.codeStats 0ms

/Tools/scripts/cleanfuture.py

http://unladen-swallow.googlecode.com/
Python | 276 lines | 253 code | 7 blank | 16 comment | 7 complexity | 5e039e3ec0eacc7c00bdbd82c52a82e3 MD5 | raw file
  1#! /usr/bin/env python
  2
  3"""cleanfuture [-d][-r][-v] path ...
  4
  5-d  Dry run.  Analyze, but don't make any changes to, files.
  6-r  Recurse.  Search for all .py files in subdirectories too.
  7-v  Verbose.  Print informative msgs.
  8
  9Search Python (.py) files for future statements, and remove the features
 10from such statements that are already mandatory in the version of Python
 11you're using.
 12
 13Pass one or more file and/or directory paths.  When a directory path, all
 14.py files within the directory will be examined, and, if the -r option is
 15given, likewise recursively for subdirectories.
 16
 17Overwrites files in place, renaming the originals with a .bak extension. If
 18cleanfuture finds nothing to change, the file is left alone.  If cleanfuture
 19does change a file, the changed file is a fixed-point (i.e., running
 20cleanfuture on the resulting .py file won't change it again, at least not
 21until you try it again with a later Python release).
 22
 23Limitations:  You can do these things, but this tool won't help you then:
 24
 25+ A future statement cannot be mixed with any other statement on the same
 26  physical line (separated by semicolon).
 27
 28+ A future statement cannot contain an "as" clause.
 29
 30Example:  Assuming you're using Python 2.2, if a file containing
 31
 32from __future__ import nested_scopes, generators
 33
 34is analyzed by cleanfuture, the line is rewritten to
 35
 36from __future__ import generators
 37
 38because nested_scopes is no longer optional in 2.2 but generators is.
 39"""
 40
 41import __future__
 42import tokenize
 43import os
 44import sys
 45
 46dryrun  = 0
 47recurse = 0
 48verbose = 0
 49
 50def errprint(*args):
 51    strings = map(str, args)
 52    msg = ' '.join(strings)
 53    if msg[-1:] != '\n':
 54        msg += '\n'
 55    sys.stderr.write(msg)
 56
 57def main():
 58    import getopt
 59    global verbose, recurse, dryrun
 60    try:
 61        opts, args = getopt.getopt(sys.argv[1:], "drv")
 62    except getopt.error, msg:
 63        errprint(msg)
 64        return
 65    for o, a in opts:
 66        if o == '-d':
 67            dryrun += 1
 68        elif o == '-r':
 69            recurse += 1
 70        elif o == '-v':
 71            verbose += 1
 72    if not args:
 73        errprint("Usage:", __doc__)
 74        return
 75    for arg in args:
 76        check(arg)
 77
 78def check(file):
 79    if os.path.isdir(file) and not os.path.islink(file):
 80        if verbose:
 81            print "listing directory", file
 82        names = os.listdir(file)
 83        for name in names:
 84            fullname = os.path.join(file, name)
 85            if ((recurse and os.path.isdir(fullname) and
 86                 not os.path.islink(fullname))
 87                or name.lower().endswith(".py")):
 88                check(fullname)
 89        return
 90
 91    if verbose:
 92        print "checking", file, "...",
 93    try:
 94        f = open(file)
 95    except IOError, msg:
 96        errprint("%r: I/O Error: %s" % (file, str(msg)))
 97        return
 98
 99    ff = FutureFinder(f, file)
100    changed = ff.run()
101    if changed:
102        ff.gettherest()
103    f.close()
104    if changed:
105        if verbose:
106            print "changed."
107            if dryrun:
108                print "But this is a dry run, so leaving it alone."
109        for s, e, line in changed:
110            print "%r lines %d-%d" % (file, s+1, e+1)
111            for i in range(s, e+1):
112                print ff.lines[i],
113            if line is None:
114                print "-- deleted"
115            else:
116                print "-- change to:"
117                print line,
118        if not dryrun:
119            bak = file + ".bak"
120            if os.path.exists(bak):
121                os.remove(bak)
122            os.rename(file, bak)
123            if verbose:
124                print "renamed", file, "to", bak
125            g = open(file, "w")
126            ff.write(g)
127            g.close()
128            if verbose:
129                print "wrote new", file
130    else:
131        if verbose:
132            print "unchanged."
133
134class FutureFinder:
135
136    def __init__(self, f, fname):
137        self.f = f
138        self.fname = fname
139        self.ateof = 0
140        self.lines = [] # raw file lines
141
142        # List of (start_index, end_index, new_line) triples.
143        self.changed = []
144
145    # Line-getter for tokenize.
146    def getline(self):
147        if self.ateof:
148            return ""
149        line = self.f.readline()
150        if line == "":
151            self.ateof = 1
152        else:
153            self.lines.append(line)
154        return line
155
156    def run(self):
157        STRING = tokenize.STRING
158        NL = tokenize.NL
159        NEWLINE = tokenize.NEWLINE
160        COMMENT = tokenize.COMMENT
161        NAME = tokenize.NAME
162        OP = tokenize.OP
163
164        changed = self.changed
165        get = tokenize.generate_tokens(self.getline).next
166        type, token, (srow, scol), (erow, ecol), line = get()
167
168        # Chew up initial comments and blank lines (if any).
169        while type in (COMMENT, NL, NEWLINE):
170            type, token, (srow, scol), (erow, ecol), line = get()
171
172        # Chew up docstring (if any -- and it may be implicitly catenated!).
173        while type is STRING:
174            type, token, (srow, scol), (erow, ecol), line = get()
175
176        # Analyze the future stmts.
177        while 1:
178            # Chew up comments and blank lines (if any).
179            while type in (COMMENT, NL, NEWLINE):
180                type, token, (srow, scol), (erow, ecol), line = get()
181
182            if not (type is NAME and token == "from"):
183                break
184            startline = srow - 1    # tokenize is one-based
185            type, token, (srow, scol), (erow, ecol), line = get()
186
187            if not (type is NAME and token == "__future__"):
188                break
189            type, token, (srow, scol), (erow, ecol), line = get()
190
191            if not (type is NAME and token == "import"):
192                break
193            type, token, (srow, scol), (erow, ecol), line = get()
194
195            # Get the list of features.
196            features = []
197            while type is NAME:
198                features.append(token)
199                type, token, (srow, scol), (erow, ecol), line = get()
200
201                if not (type is OP and token == ','):
202                    break
203                type, token, (srow, scol), (erow, ecol), line = get()
204
205            # A trailing comment?
206            comment = None
207            if type is COMMENT:
208                comment = token
209                type, token, (srow, scol), (erow, ecol), line = get()
210
211            if type is not NEWLINE:
212                errprint("Skipping file %r; can't parse line %d:\n%s" %
213                         (self.fname, srow, line))
214                return []
215
216            endline = srow - 1
217
218            # Check for obsolete features.
219            okfeatures = []
220            for f in features:
221                object = getattr(__future__, f, None)
222                if object is None:
223                    # A feature we don't know about yet -- leave it in.
224                    # They'll get a compile-time error when they compile
225                    # this program, but that's not our job to sort out.
226                    okfeatures.append(f)
227                else:
228                    released = object.getMandatoryRelease()
229                    if released is None or released <= sys.version_info:
230                        # Withdrawn or obsolete.
231                        pass
232                    else:
233                        okfeatures.append(f)
234
235            # Rewrite the line if at least one future-feature is obsolete.
236            if len(okfeatures) < len(features):
237                if len(okfeatures) == 0:
238                    line = None
239                else:
240                    line = "from __future__ import "
241                    line += ', '.join(okfeatures)
242                    if comment is not None:
243                        line += ' ' + comment
244                    line += '\n'
245                changed.append((startline, endline, line))
246
247            # Loop back for more future statements.
248
249        return changed
250
251    def gettherest(self):
252        if self.ateof:
253            self.therest = ''
254        else:
255            self.therest = self.f.read()
256
257    def write(self, f):
258        changed = self.changed
259        assert changed
260        # Prevent calling this again.
261        self.changed = []
262        # Apply changes in reverse order.
263        changed.reverse()
264        for s, e, line in changed:
265            if line is None:
266                # pure deletion
267                del self.lines[s:e+1]
268            else:
269                self.lines[s:e+1] = [line]
270        f.writelines(self.lines)
271        # Copy over the remainder of the file.
272        if self.therest:
273            f.write(self.therest)
274
275if __name__ == '__main__':
276    main()