~bzr-pqm/bzr/bzr.dev

1 by mbp at sourcefrog
import from baz patch-364
1
#! /usr/bin/env python
2
# -*- coding: UTF-8 -*-
3
4
# This program is free software; you can redistribute it and/or modify
5
# it under the terms of the GNU General Public License as published by
6
# the Free Software Foundation; either version 2 of the License, or
7
# (at your option) any later version.
8
9
# This program is distributed in the hope that it will be useful,
10
# but WITHOUT ANY WARRANTY; without even the implied warranty of
11
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12
# GNU General Public License for more details.
13
14
# You should have received a copy of the GNU General Public License
15
# along with this program; if not, write to the Free Software
16
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
17
18
from trace import mutter
356 by Martin Pool
- pychecker fixes in bzrlib.diff
19
from errors import BzrError
1 by mbp at sourcefrog
import from baz patch-364
20
21
767 by Martin Pool
- files are only reported as modified if their name or parent has changed,
22
# TODO: Rather than building a changeset object, we should probably
23
# invoke callbacks on an object.  That object can either accumulate a
24
# list, write them out directly, etc etc.
25
568 by Martin Pool
- start adding support for showing diffs by calling out to
26
def internal_diff(old_label, oldlines, new_label, newlines, to_file):
    """Write a unified diff of two line sequences to to_file.

    old_label, new_label
        Names placed on the '---' and '+++' header lines.

    oldlines, newlines
        Sequences of text lines, each normally ending in a newline.
        Neither sequence is modified.

    to_file
        Object with a write() method.  It receives the diff followed
        by one empty line.

    Nothing at all is written if both sequences are empty.

    A final line that lacks its newline is reported the way patch
    expects: the diff line is terminated and immediately followed by
    "\\ No newline at end of file".
    """
    import difflib

    # Special workaround for Python2.3, where difflib fails if
    # both sequences are empty.
    if not oldlines and not newlines:
        return

    # The inputs are handed to difflib untouched.  A last line without
    # a newline therefore compares as different from the same text with
    # one, and shows up in the output as a diff line that itself lacks
    # a newline; that is what the loop below keys on.
    ud = difflib.unified_diff(oldlines, newlines,
                              fromfile=old_label, tofile=new_label)

    # work-around for difflib being too smart for its own good
    # if /dev/null is "1,0", patch won't recognize it as /dev/null
    if not oldlines:
        ud = list(ud)
        ud[2] = ud[2].replace('-1,0', '-0,0')
    elif not newlines:
        ud = list(ud)
        ud[2] = ud[2].replace('+1,0', '+0,0')

    for line in ud:
        to_file.write(line)
        if not line.endswith('\n'):
            # Header and hunk lines always end in a newline, so this can
            # only be the unterminated last line of one of the inputs.
            to_file.write("\n\\ No newline at end of file\n")
    to_file.write('\n')
70
71
550 by Martin Pool
- Refactor diff code into one that works purely on
72
568 by Martin Pool
- start adding support for showing diffs by calling out to
73
571 by Martin Pool
- new --diff-options to pass options through to external
74
def external_diff(old_label, oldlines, new_label, newlines, to_file,
                  diff_opts):
    """Display a diff by calling out to the external diff program.

    old_label, new_label
        Passed to diff as the two --label values.

    oldlines, newlines
        Line sequences; each is written to its own temporary file for
        diff to read.

    to_file
        Must be sys.stdout; anything else raises NotImplementedError.

    diff_opts
        List of extra option strings for diff, or None/empty for none.
        '-u' is added unless one of them starts with a known
        output-style option.

    Raises BzrError if diff ends with anything other than exit code
    0 or 1 (1 just means the files differ).
    """
    import sys

    if to_file != sys.stdout:
        raise NotImplementedError("sorry, can't send external diff other than to stdout yet",
                                  to_file)

    # make sure our own output is properly ordered before the diff
    to_file.flush()

    from tempfile import NamedTemporaryFile
    import os

    # Nested try/finally so that each temporary file is closed (and so
    # deleted) no matter where a failure happens, including while the
    # second file is being created.
    oldtmpf = NamedTemporaryFile()
    try:
        newtmpf = NamedTemporaryFile()
        try:
            # TODO: perhaps a special case for comparing to or from the empty
            # sequence; can just use /dev/null on Unix

            # TODO: if either of the files being compared already exists as a
            # regular named file (e.g. in the working directory) then we can
            # compare directly to that, rather than copying it.

            oldtmpf.writelines(oldlines)
            newtmpf.writelines(newlines)

            # the child process reads the files by name, so the data
            # must be flushed out of our buffers first
            oldtmpf.flush()
            newtmpf.flush()

            if not diff_opts:
                diff_opts = []
            diffcmd = ['diff',
                       '--label', old_label,
                       oldtmpf.name,
                       '--label', new_label,
                       newtmpf.name]

            # diff only allows one style to be specified; they don't override.
            # note that some of these take optargs, and the optargs can be
            # directly appended to the options.
            # this is only an approximate parser; it doesn't properly understand
            # the grammar.
            style_prefixes = ['-c', '-u', '-C', '-U',
                              '-e', '--ed',
                              '-q', '--brief',
                              '--normal',
                              '-n', '--rcs',
                              '-y', '--side-by-side',
                              '-D', '--ifdef']
            style_given = False
            for opt in diff_opts:
                for prefix in style_prefixes:
                    if opt.startswith(prefix):
                        style_given = True
                        break
                if style_given:
                    break
            if not style_given:
                diffcmd.append('-u')

            if diff_opts:
                diffcmd.extend(diff_opts)

            rc = os.spawnvp(os.P_WAIT, 'diff', diffcmd)

            if rc != 0 and rc != 1:
                # returns 1 if files differ; that's OK
                if rc < 0:
                    msg = 'signal %d' % (-rc)
                else:
                    msg = 'exit code %d' % rc

                # report the readable description, not the raw number
                raise BzrError('external diff failed with %s; command: %r' % (msg, diffcmd))
        finally:
            newtmpf.close()             # and delete
    finally:
        oldtmpf.close()                 # and delete
151
    
152
153
571 by Martin Pool
- new --diff-options to pass options through to external
154
def show_diff(b, revision, specific_files, external_diff_options=None):
    """Shortcut for showing the diff to the working tree.

    b
        Branch.

    revision
        None to compare against the branch's basis tree, or otherwise
        the old revision to compare against.

    specific_files
        Passed through to show_diff_trees().

    external_diff_options
        Passed through to show_diff_trees().

    The output always goes to sys.stdout.

    The more general form is show_diff_trees(), where the caller
    supplies any two trees.
    """
    import sys

    # identity test: None is the "no revision given" marker
    if revision is None:
        old_tree = b.basis_tree()
    else:
        old_tree = b.revision_tree(b.lookup_revision(revision))

    new_tree = b.working_tree()

    show_diff_trees(old_tree, new_tree, sys.stdout, specific_files,
                    external_diff_options)
177
178
179
180
def show_diff_trees(old_tree, new_tree, to_file, specific_files=None,
                    external_diff_options=None):
    """Show in text form the changes from one tree to another.

    to_file
        File the report is written to.

    specific_files
        Handed to compare_trees() to limit which files are looked at.

    external_diff_options
        If set, use an external GNU diff and pass these options.
    """

    # TODO: Options to control putting on a prefix or suffix, perhaps as a format string
    old_prefix = ''
    new_prefix = ''

    # Windows users, don't panic about this filename -- it is a
    # special signal to GNU patch that the file should be created or
    # deleted respectively.
    null_name = '/dev/null'

    # TODO: Generation of pseudo-diffs for added/deleted files could
    # be usefully made into a much faster special case.

    if not external_diff_options:
        differ = internal_diff
    else:
        assert isinstance(external_diff_options, basestring)
        split_opts = external_diff_options.split()
        def differ(from_label, from_lines, to_label, to_lines, out):
            external_diff(from_label, from_lines, to_label, to_lines, out,
                          split_opts)

    def text_of(tree, file_id):
        # full text of one file of a tree, as a list of lines
        return tree.get_file(file_id).readlines()

    changes = compare_trees(old_tree, new_tree, want_unchanged=False,
                            specific_files=specific_files)

    for path, file_id, kind in changes.removed:
        print >>to_file, '*** removed %s %r' % (kind, path)
        if kind != 'file':
            continue
        differ(old_prefix + path, text_of(old_tree, file_id),
               null_name, [],
               to_file)

    for path, file_id, kind in changes.added:
        print >>to_file, '*** added %s %r' % (kind, path)
        if kind != 'file':
            continue
        differ(null_name, [],
               new_prefix + path, text_of(new_tree, file_id),
               to_file)

    for old_path, new_path, file_id, kind, text_modified in changes.renamed:
        print >>to_file, '*** renamed %s %r => %r' % (kind, old_path, new_path)
        if not text_modified:
            continue
        differ(old_prefix + old_path, text_of(old_tree, file_id),
               new_prefix + new_path, text_of(new_tree, file_id),
               to_file)

    for path, file_id, kind in changes.modified:
        print >>to_file, '*** modified %s %r' % (kind, path)
        if kind != 'file':
            continue
        differ(old_prefix + path, text_of(old_tree, file_id),
               new_prefix + path, text_of(new_tree, file_id),
               to_file)
329 by Martin Pool
- refactor command functions into command classes
250
251
379 by Martin Pool
- Simpler compare_inventories() to possibly replace diff_trees
252
558 by Martin Pool
- All top-level classes inherit from object
253
class TreeDelta(object):
    """Record of the differences between two trees.

    Holds five lists of tuples:

    added
        (path, id, kind)
    removed
        (path, id, kind)
    renamed
        (oldpath, newpath, id, kind, text_modified)
    modified
        (path, id, kind)
    unchanged
        (path, id, kind)

    Each id is listed only once.

    Files that are both modified and renamed are listed only in
    renamed, with the text_modified flag true.

    Files are only considered renamed if their name has changed or
    their parent directory has changed.  Renaming a directory
    does not count as renaming all its contents.

    The lists are normally sorted when the delta is created.
    """
    def __init__(self):
        self.added = []
        self.removed = []
        self.renamed = []
        self.modified = []
        self.unchanged = []

    def __eq__(self, other):
        """Equal when other is a TreeDelta and all five lists match."""
        if not isinstance(other, TreeDelta):
            return False
        for attr in ('added', 'removed', 'renamed', 'modified', 'unchanged'):
            if not (getattr(self, attr) == getattr(other, attr)):
                return False
        return True

    def __ne__(self, other):
        if self == other:
            return False
        return True

    def __repr__(self):
        fields = (self.added, self.removed, self.renamed,
                  self.modified, self.unchanged)
        return ("TreeDelta(added=%r, removed=%r, renamed=%r, modified=%r,"
                " unchanged=%r)" % fields)

    def has_changed(self):
        """Return True if anything is added, removed, renamed or modified.

        The unchanged list is not counted.
        """
        total = 0
        for entries in (self.added, self.removed, self.renamed,
                        self.modified):
            total += len(entries)
        return total != 0

    def touches_file_id(self, file_id):
        """Return True if file_id is modified by this delta."""
        # position of the id inside each kind of tuple
        for entries, id_index in ((self.added, 1),
                                  (self.removed, 1),
                                  (self.modified, 1),
                                  (self.renamed, 2)):
            for entry in entries:
                if entry[id_index] == file_id:
                    return True
        return False

    def show(self, to_file, show_ids=False, show_unchanged=False):
        """Write a listing of the delta, one section per list, to to_file.

        show_ids
            Also print the file id next to each path.

        show_unchanged
            Also print the section of unchanged files.

        Empty sections are left out.
        """
        def show_section(heading, entries):
            print >>to_file, heading
            for path, fid, kind in entries:
                # mark symlinks and directories with a trailing character
                if kind == 'symlink':
                    path += '@'
                elif kind == 'directory':
                    path += '/'

                if not show_ids:
                    print >>to_file, ' ', path
                else:
                    print >>to_file, '  %-30s %s' % (path, fid)

        if self.removed:
            show_section('removed:', self.removed)

        if self.added:
            show_section('added:', self.added)

        if self.renamed:
            print >>to_file, 'renamed:'
            for oldpath, newpath, fid, kind, text_modified in self.renamed:
                if not show_ids:
                    print >>to_file, '  %s => %s' % (oldpath, newpath)
                else:
                    print >>to_file, '  %s => %s %s' % (oldpath, newpath, fid)

        if self.modified:
            show_section('modified:', self.modified)

        if show_unchanged and self.unchanged:
            show_section('unchanged:', self.unchanged)
460 by Martin Pool
- new testing command compare-trees
357
358
359
746 by Martin Pool
- compare_trees doesn't return unchanged files by default
360
def compare_trees(old_tree, new_tree, want_unchanged=False, specific_files=None):
    """Work out what changed between old_tree and new_tree.

    Returns a TreeDelta listing the added, removed, renamed and
    modified entries, each list sorted.

    The root entry is specifically exempt.

    This only considers versioned files.

    want_unchanged
        If true, also list files unchanged from one version to
        the next.

    specific_files
        If true, only check for changes to specified names or
        files within them.
    """

    from osutils import is_inside_any

    old_inv = old_tree.inventory
    new_inv = new_tree.inventory
    delta = TreeDelta()
    mutter('start compare_trees')

    # TODO: match for specific files can be rather smarter by finding
    # the IDs of those files up front and then considering only that.

    for file_id in old_tree:
        if file_id not in new_tree:
            # only in the old tree, so it was removed
            kind = old_inv.get_file_kind(file_id)
            old_path = old_inv.id2path(file_id)
            if specific_files and not is_inside_any(specific_files, old_path):
                continue
            delta.removed.append((old_path, file_id, kind))
            continue

        # present in both trees
        kind = old_inv.get_file_kind(file_id)
        assert kind == new_inv.get_file_kind(file_id)

        assert kind in ('file', 'directory', 'symlink', 'root_directory'), \
               'invalid file kind %r' % kind

        if kind == 'root_directory':
            continue

        old_path = old_inv.id2path(file_id)
        new_path = new_inv.id2path(file_id)

        old_ie = old_inv[file_id]
        new_ie = new_inv[file_id]

        # keep the entry if either its old or its new location is wanted
        if specific_files and not (is_inside_any(specific_files, old_path)
                                   or is_inside_any(specific_files, new_path)):
            continue

        # only files have text to compare
        text_modified = False
        if kind == 'file':
            text_modified = (old_tree.get_file_sha1(file_id)
                             != new_tree.get_file_sha1(file_id))

        # TODO: Can possibly avoid calculating path strings if the
        # two files are unchanged and their names and parents are
        # the same and the parents are unchanged all the way up.
        # May not be worthwhile.

        moved = (old_ie.name != new_ie.name
                 or old_ie.parent_id != new_ie.parent_id)
        if moved:
            delta.renamed.append((old_path, new_path, file_id, kind,
                                  text_modified))
        elif text_modified:
            delta.modified.append((new_path, file_id, kind))
        elif want_unchanged:
            delta.unchanged.append((new_path, file_id, kind))

    mutter('start looking for new files')
    for file_id in new_inv:
        if file_id not in old_inv:
            new_path = new_inv.id2path(file_id)
            if specific_files and not is_inside_any(specific_files, new_path):
                continue
            kind = new_inv.get_file_kind(file_id)
            delta.added.append((new_path, file_id, kind))

    for entries in (delta.removed, delta.added, delta.renamed,
                    delta.modified, delta.unchanged):
        entries.sort()

    return delta