~bzr-pqm/bzr/bzr.dev

1658.1.9 by Martin Pool
Give an error for bzr diff on an nonexistent file (Malone #3619)
1
# Copyright (C) 2004, 2005, 2006 Canonical Ltd.
1711.2.54 by John Arbash Meinel
Use mkstemp instead of NamedTemporary file for external diff.
2
#
1 by mbp at sourcefrog
import from baz patch-364
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
1711.2.54 by John Arbash Meinel
Use mkstemp instead of NamedTemporary file for external diff.
7
#
1 by mbp at sourcefrog
import from baz patch-364
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
1711.2.54 by John Arbash Meinel
Use mkstemp instead of NamedTemporary file for external diff.
12
#
1 by mbp at sourcefrog
import from baz patch-364
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
2520.4.140 by Aaron Bentley
Use matching blocks from mpdiff for knit delta creation
17
import difflib
1711.2.54 by John Arbash Meinel
Use mkstemp instead of NamedTemporary file for external diff.
18
import os
1899.1.5 by John Arbash Meinel
Always buffer the output of diff, so we can check if retcode==2 is because of Binary files
19
import re
1996.3.9 by John Arbash Meinel
lazy_import diff.py
20
import sys
21
22
from bzrlib.lazy_import import lazy_import
23
lazy_import(globals(), """
24
import errno
1692.8.7 by James Henstridge
changes suggested by John Meinel
25
import subprocess
1711.2.54 by John Arbash Meinel
Use mkstemp instead of NamedTemporary file for external diff.
26
import tempfile
1740.2.5 by Aaron Bentley
Merge from bzr.dev
27
import time
28
1955.2.10 by John Arbash Meinel
Unset a few other LANG type variables when spawning diff
29
from bzrlib import (
30
    errors,
31
    osutils,
1996.3.9 by John Arbash Meinel
lazy_import diff.py
32
    patiencediff,
33
    textfile,
1551.12.29 by Aaron Bentley
Copy and extend patch date formatting code, add patch-date parsing
34
    timestamp,
1955.2.10 by John Arbash Meinel
Unset a few other LANG type variables when spawning diff
35
    )
1996.3.9 by John Arbash Meinel
lazy_import diff.py
36
""")
37
38
from bzrlib.symbol_versioning import (
39
        deprecated_function,
40
        )
1711.2.54 by John Arbash Meinel
Use mkstemp instead of NamedTemporary file for external diff.
41
from bzrlib.trace import mutter, warning
1 by mbp at sourcefrog
import from baz patch-364
42
1711.2.24 by John Arbash Meinel
Late bind to PatienceSequenceMatcher to allow plugin to override.
43
767 by Martin Pool
- files are only reported as modified if their name or parent has changed,
44
# TODO: Rather than building a changeset object, we should probably
45
# invoke callbacks on an object.  That object can either accumulate a
46
# list, write them out directly, etc etc.
47
2520.4.140 by Aaron Bentley
Use matching blocks from mpdiff for knit delta creation
48
49
class _PrematchedMatcher(difflib.SequenceMatcher):
    """Allow SequenceMatcher operations to use predetermined blocks.

    The matcher is given its matching blocks up front instead of computing
    them from two sequences, so the block-derived operations of
    SequenceMatcher (such as get_opcodes) work from the supplied data.
    """

    def __init__(self, matching_blocks):
        """Create a matcher around already-known matching blocks.

        :param matching_blocks: The value to be returned by
            get_matching_blocks(); stored as-is on the instance.
        """
        # Initialise the base class on *this* instance.  Calling
        # difflib.SequenceMatcher(self, None, None) would only build and
        # discard a second matcher, leaving the base attributes unset here.
        difflib.SequenceMatcher.__init__(self, None, None)
        self.matching_blocks = matching_blocks
        # Cleared so that opcodes are derived from the supplied blocks.
        self.opcodes = None
56
57
1558.15.11 by Aaron Bentley
Apply merge review suggestions
58
def internal_diff(old_filename, oldlines, new_filename, newlines, to_file,
                  allow_binary=False, sequence_matcher=None,
                  path_encoding='utf8'):
    """Write a unified diff between two sequences of lines to to_file.

    :param old_filename: Label for the old text; it is encoded with
        path_encoding and used as the 'from' file name of the diff.
    :param oldlines: The old text, as a sequence of lines.
    :param new_filename: Label for the new text; it is encoded with
        path_encoding and used as the 'to' file name of the diff.
    :param newlines: The new text, as a sequence of lines.
    :param to_file: File-like object the diff is written to.
    :param allow_binary: If False, both texts are first passed to
        textfile.check_text_lines().
    :param sequence_matcher: Matcher class handed to
        patiencediff.unified_diff.  When None,
        patiencediff.PatienceSequenceMatcher is looked up at call time.
    :param path_encoding: Encoding applied to the two file name labels.
    :return: None.  Nothing is written when both texts are empty or when
        the comparison yields no diff lines.
    """
    # FIXME: difflib is wrong if there is no trailing newline.
    # The syntax used by patch seems to be "\ No newline at
    # end of file" following the last diff line from that
    # file.  This is not trivial to insert into the
    # unified_diff output and it might be better to just fix
    # or replace that function.

    # In the meantime we at least make sure the patch isn't
    # mangled.

    # Special workaround for Python2.3, where difflib fails if
    # both sequences are empty.
    if not oldlines and not newlines:
        return

    if allow_binary is False:
        textfile.check_text_lines(oldlines)
        textfile.check_text_lines(newlines)

    if sequence_matcher is None:
        sequence_matcher = patiencediff.PatienceSequenceMatcher
    ud = patiencediff.unified_diff(oldlines, newlines,
                      fromfile=old_filename.encode(path_encoding),
                      tofile=new_filename.encode(path_encoding),
                      sequencematcher=sequence_matcher)

    ud = list(ud)
    if not ud:
        # No diff lines at all (e.g. identical texts): there are no header
        # lines to patch up below, so indexing ud would raise IndexError.
        return
    # work-around for difflib being too smart for its own good
    # if /dev/null is "1,0", patch won't recognize it as /dev/null
    if not oldlines:
        ud[2] = ud[2].replace('-1,0', '-0,0')
    elif not newlines:
        ud[2] = ud[2].replace('+1,0', '+0,0')
    # work around for difflib emitting random spaces after the label
    ud[0] = ud[0][:-2] + '\n'
    ud[1] = ud[1][:-2] + '\n'

    for line in ud:
        to_file.write(line)
        if not line.endswith('\n'):
            # Mark a missing final newline the way patch expects it.
            to_file.write("\n\\ No newline at end of file\n")
    to_file.write('\n')
475 by Martin Pool
- rewrite diff using compare_trees()
104
105
1920.1.1 by John Arbash Meinel
fix bug #56307, handle binary files even when LANG is not english
106
def _spawn_external_diff(diffcmd, capture_errors=True):
    """Spawn the external diff process, and return the child handle.

    :param diffcmd: The command list to spawn
    :param capture_errors: When true, stderr is captured through a pipe and
        the child is given a minimal environment: PATH (if we have one)
        plus LANGUAGE, LANG and LC_ALL all set to 'C'.  This lets us read
        and understand the output of diff, and respond to any errors.
        When false, no environment or stderr override is passed to Popen.
    :return: A Popen object whose stdin and stdout are pipes.
    :raises errors.NoDiff: if spawning fails with ENOENT.  Any other
        OSError is re-raised unchanged.
    """
    child_env = None
    child_stderr = None
    if capture_errors:
        # construct minimal environment
        child_env = {}
        search_path = os.environ.get('PATH')
        if search_path is not None:
            child_env['PATH'] = search_path
        child_env['LANGUAGE'] = 'C'   # on win32 only LANGUAGE has effect
        child_env['LANG'] = 'C'
        child_env['LC_ALL'] = 'C'
        child_stderr = subprocess.PIPE

    try:
        return subprocess.Popen(diffcmd,
                                stdin=subprocess.PIPE,
                                stdout=subprocess.PIPE,
                                stderr=child_stderr,
                                env=child_env)
    except OSError:
        failure = sys.exc_info()[1]
        if failure.errno == errno.ENOENT:
            raise errors.NoDiff(str(failure))
        raise
141
142
1185.35.29 by Aaron Bentley
Support whitespace in diff filenames
143
def external_diff(old_filename, oldlines, new_filename, newlines, to_file,
                  diff_opts):
    """Display a diff by calling out to the external diff program.

    Both texts are written to temporary files, 'diff' is run on them with
    the given names as labels, and its output (plus one trailing newline,
    for consistency with internal_diff) is written to to_file.

    diff is first run with a 'C' locale so its messages can be parsed.  If
    it exits with code 2 it is run again in the native environment so the
    user sees a localised message; that output is written to to_file, and
    an exit caused by "files differ" (binary files) is not an error.

    :param old_filename: Label shown for the old text.
    :param oldlines: Lines of the old text.
    :param new_filename: Label shown for the new text.
    :param newlines: Lines of the new text.
    :param to_file: File-like object receiving the output; it is flushed
        before diff is run.
    :param diff_opts: Extra options for diff, or a false value for none.
        '-u' is added unless one of the options already looks like an
        output-style option.
    :raises errors.BzrError: if diff fails for any reason other than
        reporting that binary files differ.
    """
    # make sure our own output is properly ordered before the diff
    to_file.flush()

    oldtmp_fd, old_abspath = tempfile.mkstemp(prefix='bzr-diff-old-')
    newtmp_fd, new_abspath = tempfile.mkstemp(prefix='bzr-diff-new-')
    oldtmpf = os.fdopen(oldtmp_fd, 'wb')
    newtmpf = os.fdopen(newtmp_fd, 'wb')

    try:
        # TODO: perhaps a special case for comparing to or from the empty
        # sequence; can just use /dev/null on Unix

        # TODO: if either of the files being compared already exists as a
        # regular named file (e.g. in the working directory) then we can
        # compare directly to that, rather than copying it.

        oldtmpf.writelines(oldlines)
        newtmpf.writelines(newlines)

        # Close before spawning so diff sees the complete contents.
        oldtmpf.close()
        newtmpf.close()

        if not diff_opts:
            diff_opts = []
        diffcmd = ['diff',
                   '--label', old_filename,
                   old_abspath,
                   '--label', new_filename,
                   new_abspath,
                   '--binary',
                  ]

        # diff only allows one style to be specified; they don't override.
        # note that some of these take optargs, and the optargs can be
        # directly appended to the options.
        # this is only an approximate parser; it doesn't properly understand
        # the grammar.
        for s in ['-c', '-u', '-C', '-U',
                  '-e', '--ed',
                  '-q', '--brief',
                  '--normal',
                  '-n', '--rcs',
                  '-y', '--side-by-side',
                  '-D', '--ifdef']:
            for j in diff_opts:
                if j.startswith(s):
                    break
            else:
                continue
            break
        else:
            # No style option was supplied: default to unified output.
            diffcmd.append('-u')

        if diff_opts:
            diffcmd.extend(diff_opts)

        pipe = _spawn_external_diff(diffcmd, capture_errors=True)
        out, err = pipe.communicate()
        rc = pipe.returncode

        # internal_diff() adds a trailing newline, add one here for consistency
        out += '\n'
        if rc == 2:
            # 'diff' gives retcode == 2 for all sorts of errors
            # one of those is 'Binary files differ'.
            # Bad options could also be the problem.
            # 'Binary files' is not a real error, so we suppress that error.
            lang_c_out = out

            # Since we got here, we want to make sure to give an i18n error
            pipe = _spawn_external_diff(diffcmd, capture_errors=False)
            out, err = pipe.communicate()

            # Write out the new i18n diff response
            to_file.write(out+'\n')
            if pipe.returncode != 2:
                raise errors.BzrError(
                               'external diff failed with exit code 2'
                               ' when run with LANG=C and LC_ALL=C,'
                               ' but not when run natively: %r' % (diffcmd,))

            first_line = lang_c_out.split('\n', 1)[0]
            # Starting with diffutils 2.8.4 the word "binary" was dropped.
            m = re.match('^(binary )?files.*differ$', first_line, re.I)
            if m is None:
                raise errors.BzrError('external diff failed with exit code 2;'
                                      ' command: %r' % (diffcmd,))
            else:
                # Binary files differ, just return
                return

        # If we got to here, we haven't written out the output of diff
        # do so now
        to_file.write(out)
        if rc not in (0, 1):
            # returns 1 if files differ; that's OK
            if rc < 0:
                msg = 'signal %d' % (-rc)
            else:
                msg = 'exit code %d' % rc

            # Report the description built above, not the bare return code.
            raise errors.BzrError('external diff failed with %s; command: %r'
                                  % (msg, diffcmd))

    finally:
        # Closing again is harmless and covers failures before the explicit
        # close above.
        oldtmpf.close()
        newtmpf.close()
        # Clean up. Warn in case the files couldn't be deleted
        # (in case windows still holds the file open, but not
        # if the files have already been deleted)
        for tmp_path in (old_abspath, new_abspath):
            try:
                os.remove(tmp_path)
            except OSError:
                # Fetch the exception being handled for this very file, so
                # the check below never sees a stale or undefined name.
                e = sys.exc_info()[1]
                if e.errno not in (errno.ENOENT,):
                    warning('Failed to delete temporary file: %s %s',
                            tmp_path, e)
568 by Martin Pool
- start adding support for showing diffs by calling out to
269
1551.2.13 by Aaron Bentley
Got diff working properly with checkouts
270
1551.2.15 by Aaron Bentley
Rename cmd_show_diff to diff_cmd_helper
271
def diff_cmd_helper(tree, specific_files, external_diff_options,
                    old_revision_spec=None, new_revision_spec=None,
                    revision_specs=None,
                    old_label='a/', new_label='b/'):
    """Helper for cmd_diff.

    Works out the old and new trees to compare and passes them to
    show_diff_trees(), writing to sys.stdout.

    :param tree:
        A WorkingTree

    :param specific_files:
        The specific files to compare, or None

    :param external_diff_options:
        If non-None, run an external diff, and pass it these options

    :param old_revision_spec:
        If None, use basis tree as old revision, otherwise use the tree for
        the specified revision.

    :param new_revision_spec:
        If None (or if its 'spec' attribute is None), use working tree as
        new revision, otherwise use the tree for the specified revision.

    :param revision_specs:
        Zero, one or two RevisionSpecs from the command line, saying what
        revisions to compare.  This can be passed as an alternative to the
        old_revision_spec and new_revision_spec parameters.

    :param old_label:
        Passed through to show_diff_trees().

    :param new_label:
        Passed through to show_diff_trees().

    The more general form is show_diff_trees(), where the caller
    supplies any two trees.
    """

    # TODO: perhaps remove the old parameters old_revision_spec and
    # new_revision_spec, since this is only really for use from cmd_diff and
    # it now always passes through a sequence of revision_specs -- mbp
    # 20061221

    def spec_tree(spec):
        # Resolve a revision spec to the revision tree it names.
        if tree:
            resolved = spec.in_store(tree.branch)
        else:
            resolved = spec.in_store(None)
        rev_id = resolved.rev_id
        repository = resolved.branch.repository
        return repository.revision_tree(rev_id)

    if revision_specs is not None:
        assert (old_revision_spec is None
                and new_revision_spec is None)
        spec_count = len(revision_specs)
        if spec_count > 0:
            old_revision_spec = revision_specs[0]
        if spec_count > 1:
            new_revision_spec = revision_specs[1]

    if old_revision_spec is not None:
        old_tree = spec_tree(old_revision_spec)
    else:
        old_tree = tree.basis_tree()

    use_working_tree = (new_revision_spec is None
                        or new_revision_spec.spec is None)
    if use_working_tree:
        new_tree = tree
    else:
        new_tree = spec_tree(new_revision_spec)

    # The working tree is supplied as an extra tree whenever it is not
    # itself the new side of the comparison.
    if new_tree is tree:
        extra_trees = None
    else:
        extra_trees = (tree,)

    return show_diff_trees(old_tree, new_tree, sys.stdout, specific_files,
                           external_diff_options,
                           old_label=old_label, new_label=new_label,
                           extra_trees=extra_trees)
1551.2.13 by Aaron Bentley
Got diff working properly with checkouts
345
571 by Martin Pool
- new --diff-options to pass options through to external
346
347
def show_diff_trees(old_tree, new_tree, to_file, specific_files=None,
                    external_diff_options=None,
                    old_label='a/', new_label='b/',
                    extra_trees=None,
                    path_encoding='utf8'):
    """Show in text form the changes from one tree to another.

    old_tree, new_tree and every tree in extra_trees are read-locked for
    the duration of the call.

    to_file
        The file object handed to the differ for its output.

    specific_files
        If set, include only changes to these files.

    external_diff_options
        If set, use an external GNU diff and pass these options.

    old_label, new_label
        Passed through to DiffTree.from_trees_options.

    extra_trees
        If set, more Trees to use for looking up file ids

    path_encoding
        If set, the path will be encoded as specified, otherwise is supposed
        to be utf8

    Returns whatever the differ's show_diff() returns.
    """
    # Lock order matches the historical behaviour: old tree, then any extra
    # trees, then the new tree.
    to_lock = [old_tree]
    if extra_trees is not None:
        to_lock.extend(extra_trees)
    to_lock.append(new_tree)

    # Record each lock as it is taken so that a failure part-way through
    # still releases everything acquired so far.
    locked = []
    try:
        for tree in to_lock:
            tree.lock_read()
            locked.append(tree)
        differ = DiffTree.from_trees_options(old_tree, new_tree, to_file,
                                               path_encoding,
                                               external_diff_options,
                                               old_label, new_label)
        return differ.show_diff(specific_files, extra_trees)
    finally:
        # Release in the reverse order of acquisition.
        for tree in reversed(locked):
            tree.unlock()
386
387
1740.2.5 by Aaron Bentley
Merge from bzr.dev
388
def _patch_header_date(tree, file_id, path):
    """Returns a timestamp suitable for use in a patch header.

    The modification time is obtained from tree.get_file_mtime(file_id,
    path) and formatted with timestamp.format_patch_date().  An mtime of
    None is treated as a programming error (assertion).
    """
    modified = tree.get_file_mtime(file_id, path)
    assert modified is not None, (
        "got an mtime of None for file-id %s, path %s in tree %s"
        % (file_id, path, tree))
    return timestamp.format_patch_date(modified)
1740.2.5 by Aaron Bentley
Merge from bzr.dev
395
396
1662.1.9 by Martin Pool
Give a clear error for bzr status of an unversioned, nonexistent file. (Malone #3619)
397
def _raise_if_nonexistent(paths, old_tree, new_tree):
    """Complain if paths are not in either inventory or tree.

    It's OK if the files exist in either tree's inventory, or
    if they exist in the new tree but are not versioned.

    This can be used by operations such as bzr status that can accept
    unknown or ignored files.

    :raises errors.PathsDoNotExist: with the sorted list of paths that
        pass through both trees' filter_unversioned_files() and for which
        new_tree.has_filename() is false.
    """
    mutter("check paths: %r", paths)
    if not paths:
        return
    unversioned = new_tree.filter_unversioned_files(
        old_tree.filter_unversioned_files(paths))
    missing = []
    for candidate in unversioned:
        if not new_tree.has_filename(candidate):
            missing.append(candidate)
    if missing:
        raise errors.PathsDoNotExist(sorted(missing))
414
415
1398 by Robert Collins
integrate in Gustavos x-bit patch
416
def get_prop_change(meta_modified):
    """Return the text noting a property change, or '' when there is none.

    :param meta_modified: Tested for truth only.
    """
    if not meta_modified:
        return  ""
    return " (properties changed)"
421
422
3009.2.22 by Aaron Bentley
Update names & docstring
423
class DiffPath(object):
    """Base type for command objects that compare files.

    The three class constants are the possible results of a comparison.
    """

    # The type or contents of the file were unsuitable for diffing
    CANNOT_DIFF = 'CANNOT_DIFF'
    # The file has changed in a semantic way
    CHANGED = 'CHANGED'
    # The file content may have changed, but there is no semantic change
    UNCHANGED = 'UNCHANGED'

    def __init__(self, old_tree, new_tree, to_file, path_encoding='utf-8'):
        """Constructor.

        :param old_tree: The tree to show as the old tree in the comparison
        :param new_tree: The tree to show as new in the comparison
        :param to_file: The file to write comparison data to
        :param path_encoding: The character encoding to write paths in
        """
        self.old_tree, self.new_tree = old_tree, new_tree
        self.to_file = to_file
        self.path_encoding = path_encoding

    @classmethod
    def from_diff_tree(klass, diff_tree):
        """Build an instance from the trees, file and encoding of diff_tree."""
        source = diff_tree
        return klass(source.old_tree, source.new_tree,
                     source.to_file, source.path_encoding)

    @staticmethod
    def _diff_many(differs, file_id, old_path, new_path, old_kind, new_kind):
        """Try each differ in turn; return the first usable result.

        A result counts as usable when it is not the CANNOT_DIFF constant.
        If no differ produces one (or there are no differs), CANNOT_DIFF is
        returned.
        """
        for candidate in differs:
            outcome = candidate.diff(file_id, old_path, new_path, old_kind,
                                     new_kind)
            if outcome is DiffPath.CANNOT_DIFF:
                continue
            return outcome
        return DiffPath.CANNOT_DIFF
460
461
462
class DiffKindChange(object):
    """Special differ for file kind changes.

    Represents kind change as deletion + creation.  Uses the other differs
    to do this.
    """

    def __init__(self, differs):
        """Remember the differs that will handle each half of the change."""
        self.differs = differs

    @classmethod
    def from_diff_tree(klass, diff_tree):
        """Build an instance that shares diff_tree's list of differs."""
        return klass(diff_tree.differs)

    def diff(self, file_id, old_path, new_path, old_kind, new_kind):
        """Perform comparison

        :param file_id: The file_id of the file to compare
        :param old_path: Path of the file in the old tree
        :param new_path: Path of the file in the new tree
        :param old_kind: Old file-kind of the file
        :param new_kind: New file-kind of the file
        :return: DiffPath.CANNOT_DIFF if either kind is None or the
            deletion half cannot be diffed; otherwise the result of the
            creation half.
        """
        # A missing kind on either side is not a kind change; bailing out
        # also keeps the nested calls below from coming back through here.
        if None in (old_kind, new_kind):
            return DiffPath.CANNOT_DIFF
        # First half: the old kind disappearing.
        removal = DiffPath._diff_many(self.differs, file_id, old_path,
                                      new_path, old_kind, None)
        if removal is DiffPath.CANNOT_DIFF:
            return removal
        # Second half: the new kind appearing.
        creation = DiffPath._diff_many(self.differs, file_id, old_path,
                                       new_path, None, new_kind)
        return creation
492
493
3009.2.22 by Aaron Bentley
Update names & docstring
494
class DiffDirectory(DiffPath):
    """Differ for directories; it writes nothing and only classifies."""

    def diff(self, file_id, old_path, new_path, old_kind, new_kind):
        """Perform comparison between two directories.  (dummy)

        :return: CHANGED when at least one kind is 'directory' and the
            other is 'directory' or None; CANNOT_DIFF otherwise.
        """
        acceptable = ('directory', None)
        if 'directory' not in (old_kind, new_kind):
            return self.CANNOT_DIFF
        if old_kind not in acceptable or new_kind not in acceptable:
            return self.CANNOT_DIFF
        return self.CHANGED
507
3009.2.20 by Aaron Bentley
PEP8
508
3009.2.22 by Aaron Bentley
Update names & docstring
509
class DiffSymlink(DiffPath):
    """DiffPath that describes changes to symlink targets."""

    def diff(self, file_id, old_path, new_path, old_kind, new_kind):
        """Compare the symlink targets of one file-id in both trees

        :param file_id: The file_id of the file to compare
        :param old_path: Path of the file in the old tree
        :param new_path: Path of the file in the new tree
        :param old_kind: Old file-kind of the file
        :param new_kind: New file-kind of the file
        :return: self.CANNOT_DIFF unless at least one side is a symlink and
            each side is either a symlink or None; otherwise the result of
            diff_symlink.
        """
        if 'symlink' not in (old_kind, new_kind):
            return self.CANNOT_DIFF

        # The old side is resolved before the new side is examined.
        if old_kind is None:
            old_target = None
        elif old_kind == 'symlink':
            old_target = self.old_tree.get_symlink_target(file_id)
        else:
            return self.CANNOT_DIFF

        if new_kind is None:
            new_target = None
        elif new_kind == 'symlink':
            new_target = self.new_tree.get_symlink_target(file_id)
        else:
            return self.CANNOT_DIFF

        return self.diff_symlink(old_target, new_target)

    def diff_symlink(self, old_target, new_target):
        """Write a one-line description of a symlink target change

        :param old_target: Target in the old tree, or None if there was none
        :param new_target: Target in the new tree, or None if there is none
        :return: self.CHANGED, always
        """
        if old_target is None:
            message = '=== target is %r\n' % new_target
        elif new_target is None:
            message = '=== target was %r\n' % old_target
        else:
            message = ('=== target changed %r => %r\n' %
                       (old_target, new_target))
        self.to_file.write(message)
        return self.CHANGED
3009.2.11 by Aaron Bentley
Refactor diff to be more pluggable
545
546
3009.2.22 by Aaron Bentley
Update names & docstring
547
class DiffText(DiffPath):
    """DiffPath that compares the text of regular files."""

    # GNU Patch uses the epoch date to detect files that are being added
    # or removed in a diff.
    EPOCH_DATE = '1970-01-01 00:00:00 +0000'

    def __init__(self, old_tree, new_tree, to_file, path_encoding='utf-8',
                 old_label='', new_label='', text_differ=internal_diff):
        """Constructor

        :param old_tree: Tree to show as old in the comparison
        :param new_tree: Tree to show as new in the comparison
        :param to_file: File to write the comparison to
        :param path_encoding: Character encoding used when the "Binary
            files ... differ" message is written
        :param old_label: Prefix placed before the old path in labels
        :param new_label: Prefix placed before the new path in labels
        :param text_differ: Callable invoked as
            text_differ(from_label, from_lines, to_label, to_lines, to_file)
        """
        DiffPath.__init__(self, old_tree, new_tree, to_file, path_encoding)
        self.text_differ = text_differ
        self.old_label = old_label
        self.new_label = new_label
        # NOTE(review): DiffPath.__init__ is also given path_encoding and
        # may already store it; kept here because that code is not visible.
        self.path_encoding = path_encoding

    def diff(self, file_id, old_path, new_path, old_kind, new_kind):
        """Compare two files in unified diff format

        :param file_id: The file_id of the file to compare
        :param old_path: Path of the file in the old tree
        :param new_path: Path of the file in the new tree
        :param old_kind: Old file-kind of the file
        :param new_kind: New file-kind of the file
        :return: self.CANNOT_DIFF unless at least one side is a 'file' and
            each side is either a 'file' or None; otherwise the result of
            diff_text.
        """
        if 'file' not in (old_kind, new_kind):
            return self.CANNOT_DIFF
        from_file_id = to_file_id = file_id
        if old_kind == 'file':
            old_date = _patch_header_date(self.old_tree, file_id, old_path)
        elif old_kind is None:
            # Absent on the old side: label it with the epoch date and
            # diff against empty content.
            old_date = self.EPOCH_DATE
            from_file_id = None
        else:
            return self.CANNOT_DIFF
        if new_kind == 'file':
            new_date = _patch_header_date(self.new_tree, file_id, new_path)
        elif new_kind is None:
            new_date = self.EPOCH_DATE
            to_file_id = None
        else:
            return self.CANNOT_DIFF
        from_label = '%s%s\t%s' % (self.old_label, old_path, old_date)
        to_label = '%s%s\t%s' % (self.new_label, new_path, new_date)
        return self.diff_text(from_file_id, to_file_id, from_label, to_label)

    def diff_text(self, from_file_id, to_file_id, from_label, to_label):
        """Diff the content of given files in two trees

        :param from_file_id: The id of the file in the from tree.  If None,
            the file is not present in the from tree.
        :param to_file_id: The id of the file in the to tree.  This may refer
            to a different file from from_file_id.  If None,
            the file is not present in the to tree.
        :param from_label: Label passed to the text differ for the old text
        :param to_label: Label passed to the text differ for the new text
        :return: self.CHANGED, always.  If errors.BinaryFile is raised while
            reading or diffing, a "Binary files ... differ" line is written
            instead.
        """
        def _get_text(tree, file_id):
            if file_id is None:
                return []
            text_file = tree.get_file(file_id)
            # Close the file explicitly rather than relying on garbage
            # collection to release the handle.
            try:
                return text_file.readlines()
            finally:
                text_file.close()
        try:
            from_text = _get_text(self.old_tree, from_file_id)
            to_text = _get_text(self.new_tree, to_file_id)
            self.text_differ(from_label, from_text, to_label, to_text,
                             self.to_file)
        except errors.BinaryFile:
            self.to_file.write(
                  ("Binary files %s and %s differ\n" %
                  (from_label, to_label)).encode(self.path_encoding))
        return self.CHANGED
3009.2.11 by Aaron Bentley
Refactor diff to be more pluggable
615
616
3009.2.22 by Aaron Bentley
Update names & docstring
617
class DiffTree(object):
618
    """Provides textual representations of the difference between two trees.
619
620
    A DiffTree examines two trees and where a file-id has altered
621
    between them, generates a textual representation of the difference.
622
    DiffTree uses a sequence of DiffPath objects which are each
623
    given the opportunity to handle a given altered fileid. The list
624
    of DiffPath objects can be extended globally by appending to
625
    DiffTree.diff_factories, or for a specific diff operation by
3009.2.27 by Aaron Bentley
Use extra_factories instead of extra_diffs
626
    supplying the extra_factories option to the appropriate method.
3009.2.22 by Aaron Bentley
Update names & docstring
627
    """
628
629
    # list of factories that can provide instances of DiffPath objects
3009.2.17 by Aaron Bentley
Update docs
630
    # may be extended by plugins.
3009.2.28 by Aaron Bentley
Add from_diff_tree factories
631
    diff_factories = [DiffSymlink.from_diff_tree,
632
                      DiffDirectory.from_diff_tree]
3009.2.13 by Aaron Bentley
Refactor differ to support registering differ factories
633
3009.2.12 by Aaron Bentley
Associate labels with text diffing only
634
    def __init__(self, old_tree, new_tree, to_file, path_encoding='utf-8',
                 diff_text=None, extra_factories=None):
        """Build the ordered list of DiffPath objects for two trees

        :param old_tree: Tree to show as old in the comparison
        :param new_tree: Tree to show as new in the comparison
        :param to_file: File to write comparison to
        :param path_encoding: Character encoding to write paths in
        :param diff_text: DiffPath-type object to use as a last resort for
            diffing text files.  When None, a DiffText with empty labels
            and internal_diff is created.
        :param extra_factories: Factories of DiffPaths to try before any other
            DiffPaths
        """
        if diff_text is None:
            diff_text = DiffText(old_tree, new_tree, to_file, path_encoding,
                                 old_label='', new_label='',
                                 text_differ=internal_diff)
        self.old_tree = old_tree
        self.new_tree = new_tree
        self.to_file = to_file
        self.path_encoding = path_encoding
        # Factories are handed this object, so the list is filled in place,
        # one entry at a time, in priority order.
        self.differs = []
        if extra_factories is not None:
            for factory in extra_factories:
                self.differs.append(factory(self))
        for factory in self.diff_factories:
            self.differs.append(factory(self))
        # The kind-change differ is created before diff_text is appended.
        kind_change = DiffKindChange.from_diff_tree(self)
        self.differs.append(diff_text)
        self.differs.append(kind_change)
3009.2.6 by Aaron Bentley
Convert show_diff_trees into a Differ method
658
659
    @classmethod
    def from_trees_options(klass, old_tree, new_tree, to_file,
                           path_encoding, external_diff_options, old_label,
                           new_label):
        """Create a DiffTree from show_diff_trees-style options.

        :param old_tree: The tree to show as old in the comparison
        :param new_tree: The tree to show as new in the comparison
        :param to_file: File to write comparisons to
        :param path_encoding: Character encoding to use for writing paths
        :param external_diff_options: If supplied, use external_diff to
            perform file comparison, passing these whitespace-separated
            options; otherwise internal_diff is used.
        :param old_label: Prefix to use for old file labels
        :param new_label: Prefix to use for new file labels
        :return: An instance of klass whose text differ is a DiffText
            configured with the chosen diff function and labels
        """
        if not external_diff_options:
            diff_file = internal_diff
        else:
            assert isinstance(external_diff_options, basestring)
            diff_args = external_diff_options.split()

            def diff_file(old_name, old_lines, new_name, new_lines, out_file):
                # Same call shape as internal_diff, with the options added.
                external_diff(old_name, old_lines, new_name, new_lines,
                              out_file, diff_args)
        text_diff = DiffText(old_tree, new_tree, to_file, path_encoding,
                             old_label, new_label, diff_file)
        return klass(old_tree, new_tree, to_file, path_encoding, text_diff)
3009.2.6 by Aaron Bentley
Convert show_diff_trees into a Differ method
685
3009.2.12 by Aaron Bentley
Associate labels with text diffing only
686
    def show_diff(self, specific_files, extra_trees=None):
        """Write the differences between the two trees to self.to_file

        A "=== ..." header line is written for every removed, added, renamed
        and modified entry, followed by that entry's diff where applicable.

        :param specific_files: the specific files to compare (recursive)
        :param extra_trees: extra trees to use for mapping paths to file_ids
        :return: 1 if at least one entry was reported, otherwise 0
        """
        # TODO: Generation of pseudo-diffs for added/deleted files could
        # be usefully made into a much faster special case.

        def _encoded(path):
            # Characters the encoding cannot represent are replaced.
            return path.encode(self.path_encoding, "replace")

        changes = self.new_tree.changes_from(
            self.old_tree, specific_files=specific_files,
            extra_trees=extra_trees, require_versioned=True)

        found_changes = 0

        for path, file_id, kind in changes.removed:
            found_changes = 1
            self.to_file.write("=== removed %s '%s'\n"
                               % (kind, _encoded(path)))
            self.diff(file_id, path, path)

        for path, file_id, kind in changes.added:
            found_changes = 1
            self.to_file.write("=== added %s '%s'\n"
                               % (kind, _encoded(path)))
            self.diff(file_id, path, path)

        for entry in changes.renamed:
            (old_path, new_path, file_id, kind,
             text_modified, meta_modified) = entry
            found_changes = 1
            prop_str = get_prop_change(meta_modified)
            old_encoded = _encoded(old_path)
            new_encoded = _encoded(new_path)
            self.to_file.write("=== renamed %s '%s' => '%s'%s\n"
                               % (kind, old_encoded, new_encoded, prop_str))
            if not text_modified:
                continue
            self.diff(file_id, old_path, new_path)

        for entry in changes.modified:
            path, file_id, kind, text_modified, meta_modified = entry
            found_changes = 1
            prop_str = get_prop_change(meta_modified)
            self.to_file.write("=== modified %s '%s'%s\n"
                               % (kind, _encoded(path), prop_str))
            if not text_modified:
                continue
            # The file may be in a different location in the old tree (because
            # the containing dir was renamed, but the file itself was not)
            self.diff(file_id, self.old_tree.id2path(file_id), path)

        return found_changes
3009.2.2 by Aaron Bentley
Implement Differ object for abstracting diffing
734
3009.2.12 by Aaron Bentley
Associate labels with text diffing only
735
    def diff(self, file_id, old_path, new_path):
        """Diff one file-id between the old and new trees

        Each tree is asked for the kind of the file-id (None when the tree
        raises NoSuchId), and the differs in self.differs are then tried
        through DiffPath._diff_many.

        :param file_id: file-id of the file
        :param old_path: The path of the file in the old tree
        :param new_path: The path of the file in the new tree
        :raises errors.NoDiffFound: if the result is DiffPath.CANNOT_DIFF;
            the error names new_path, or old_path when new_path is None
        """
        def _kind_or_none(tree):
            try:
                return tree.kind(file_id)
            except errors.NoSuchId:
                return None

        old_kind = _kind_or_none(self.old_tree)
        new_kind = _kind_or_none(self.new_tree)

        outcome = DiffPath._diff_many(self.differs, file_id, old_path,
                                      new_path, old_kind, new_kind)
        if outcome is not DiffPath.CANNOT_DIFF:
            return
        if new_path is None:
            error_path = old_path
        else:
            error_path = new_path
        raise errors.NoDiffFound(error_path)