~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/workingtree_4.py

  • Committer: John Arbash Meinel
  • Date: 2008-07-17 03:46:13 UTC
  • mto: This revision was merged to the branch mainline in revision 3557.
  • Revision ID: john@arbash-meinel.com-20080717034613-3cqwmu9mfshqwyet
Some code cleanups.

Remove extra comments.
Use 64 bit integer math when possible.
Use PyList_Append rather than foo.append()
Use PyUnicode_AsUTF8String rather than codecs.encode()
Make sure to raise an exception if the target directory doesn't exist.
Seems to have made a significant performance impact.

Show diffs side-by-side

added added

removed removed

Lines of Context:
1
 
# Copyright (C) 2007-2010 Canonical Ltd
 
1
# Copyright (C) 2005, 2006, 2007 Canonical Ltd
2
2
#
3
3
# This program is free software; you can redistribute it and/or modify
4
4
# it under the terms of the GNU General Public License as published by
12
12
#
13
13
# You should have received a copy of the GNU General Public License
14
14
# along with this program; if not, write to the Free Software
15
 
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
16
 
17
17
"""WorkingTree4 format and implementation.
18
18
 
28
28
 
29
29
from bzrlib.lazy_import import lazy_import
30
30
lazy_import(globals(), """
 
31
from bisect import bisect_left
 
32
import collections
 
33
from copy import deepcopy
31
34
import errno
 
35
import itertools
 
36
import operator
32
37
import stat
 
38
from time import time
 
39
import warnings
33
40
 
34
41
import bzrlib
35
42
from bzrlib import (
36
43
    bzrdir,
37
44
    cache_utf8,
 
45
    conflicts as _mod_conflicts,
38
46
    debug,
 
47
    delta,
39
48
    dirstate,
40
49
    errors,
41
50
    generate_ids,
 
51
    globbing,
 
52
    ignores,
 
53
    merge,
42
54
    osutils,
43
55
    revision as _mod_revision,
44
56
    revisiontree,
 
57
    textui,
45
58
    trace,
46
59
    transform,
47
 
    views,
 
60
    urlutils,
 
61
    xml5,
 
62
    xml6,
48
63
    )
49
64
import bzrlib.branch
 
65
from bzrlib.transport import get_transport
50
66
import bzrlib.ui
51
67
""")
52
68
 
 
69
from bzrlib import symbol_versioning
53
70
from bzrlib.decorators import needs_read_lock, needs_write_lock
54
 
from bzrlib.filters import filtered_input_file, internal_size_sha_file_byname
55
 
from bzrlib.inventory import Inventory, ROOT_ID, entry_factory
 
71
from bzrlib.inventory import InventoryEntry, Inventory, ROOT_ID, entry_factory
 
72
from bzrlib.lockable_files import LockableFiles, TransportLock
 
73
from bzrlib.lockdir import LockDir
 
74
import bzrlib.mutabletree
56
75
from bzrlib.mutabletree import needs_tree_write_lock
57
76
from bzrlib.osutils import (
58
77
    file_kind,
59
78
    isdir,
 
79
    normpath,
60
80
    pathjoin,
 
81
    rand_chars,
61
82
    realpath,
62
83
    safe_unicode,
 
84
    splitpath,
63
85
    )
64
 
from bzrlib.trace import mutter
 
86
from bzrlib.trace import mutter, note
65
87
from bzrlib.transport.local import LocalTransport
66
88
from bzrlib.tree import InterTree
 
89
from bzrlib.progress import DummyProgress, ProgressPhase
 
90
from bzrlib.revision import NULL_REVISION, CURRENT_REVISION
 
91
from bzrlib.rio import RioReader, rio_file, Stanza
 
92
from bzrlib.symbol_versioning import (deprecated_passed,
 
93
        deprecated_method,
 
94
        deprecated_function,
 
95
        DEPRECATED_PARAMETER,
 
96
        )
67
97
from bzrlib.tree import Tree
68
98
from bzrlib.workingtree import WorkingTree, WorkingTree3, WorkingTreeFormat3
69
99
 
70
100
 
71
 
class DirStateWorkingTree(WorkingTree3):
 
101
# This is the Windows equivalent of ENOTDIR
 
102
# It is defined in pywin32.winerror, but we don't want a strong dependency for
 
103
# just an error code.
 
104
ERROR_PATH_NOT_FOUND = 3
 
105
ERROR_DIRECTORY = 267
 
106
 
 
107
 
 
108
class WorkingTree4(WorkingTree3):
 
109
    """This is the Format 4 working tree.
 
110
 
 
111
    This differs from WorkingTree3 by:
 
112
     - Having a consolidated internal dirstate, stored in a
 
113
       randomly-accessible sorted file on disk.
 
114
     - Not having a regular inventory attribute.  One can be synthesized 
 
115
       on demand but this is expensive and should be avoided.
 
116
 
 
117
    This is new in bzr 0.15.
 
118
    """
 
119
 
72
120
    def __init__(self, basedir,
73
121
                 branch,
74
122
                 _control_files=None,
100
148
        #-------------
101
149
        self._setup_directory_is_tree_reference()
102
150
        self._detect_case_handling()
103
 
        self._rules_searcher = None
104
 
        self.views = self._make_views()
105
 
        #--- allow tests to select the dirstate iter_changes implementation
106
 
        self._iter_changes = dirstate._process_entry
107
151
 
108
152
    @needs_tree_write_lock
109
153
    def _add(self, files, ids, kinds):
137
181
    @needs_tree_write_lock
138
182
    def add_reference(self, sub_tree):
139
183
        # use standard implementation, which calls back to self._add
140
 
        #
 
184
        # 
141
185
        # So we don't store the reference_revision in the working dirstate,
142
 
        # it's just recorded at the moment of commit.
 
186
        # it's just recorded at the moment of commit. 
143
187
        self._add_reference(sub_tree)
144
188
 
145
189
    def break_lock(self):
184
228
            WorkingTree3._comparison_data(self, entry, path)
185
229
        # it looks like a plain directory, but it's really a reference -- see
186
230
        # also kind()
187
 
        if (self._repo_supports_tree_reference and kind == 'directory'
188
 
            and entry is not None and entry.kind == 'tree-reference'):
 
231
        if (self._repo_supports_tree_reference and
 
232
            kind == 'directory' and
 
233
            self._directory_is_tree_reference(path)):
189
234
            kind = 'tree-reference'
190
235
        return kind, executable, stat_value
191
236
 
217
262
            return self._dirstate
218
263
        local_path = self.bzrdir.get_workingtree_transport(None
219
264
            ).local_abspath('dirstate')
220
 
        self._dirstate = dirstate.DirState.on_file(local_path,
221
 
            self._sha1_provider())
 
265
        self._dirstate = dirstate.DirState.on_file(local_path)
222
266
        return self._dirstate
223
267
 
224
 
    def _sha1_provider(self):
225
 
        """A function that returns a SHA1Provider suitable for this tree.
226
 
 
227
 
        :return: None if content filtering is not supported by this tree.
228
 
          Otherwise, a SHA1Provider is returned that sha's the canonical
229
 
          form of files, i.e. after read filters are applied.
230
 
        """
231
 
        if self.supports_content_filtering():
232
 
            return ContentFilterAwareSHA1Provider(self)
233
 
        else:
234
 
            return None
235
 
 
236
268
    def filter_unversioned_files(self, paths):
237
269
        """Filter out paths that are versioned.
238
270
 
270
302
 
271
303
    def _generate_inventory(self):
272
304
        """Create and set self.inventory from the dirstate object.
273
 
 
 
305
        
274
306
        This is relatively expensive: we have to walk the entire dirstate.
275
307
        Ideally we would not, and can deprecate this function.
276
308
        """
321
353
                    parent_ies[(dirname + '/' + name).strip('/')] = inv_entry
322
354
                elif kind == 'tree-reference':
323
355
                    if not self._repo_supports_tree_reference:
324
 
                        raise errors.UnsupportedOperation(
325
 
                            self._generate_inventory,
326
 
                            self.branch.repository)
 
356
                        raise AssertionError(
 
357
                            "repository of %r "
 
358
                            "doesn't support tree references "
 
359
                            "required by entry %r"
 
360
                            % (self, name))
327
361
                    inv_entry.reference_revision = link_or_sha1 or None
328
362
                elif kind != 'symlink':
329
363
                    raise AssertionError("unknown kind %r" % kind)
344
378
        If either file_id or path is supplied, it is used as the key to lookup.
345
379
        If both are supplied, the fastest lookup is used, and an error is
346
380
        raised if they do not both point at the same row.
347
 
 
 
381
        
348
382
        :param file_id: An optional unicode file_id to be looked up.
349
383
        :param path: An optional unicode path to be looked up.
350
384
        :return: The dirstate row tuple for path/file_id, or (None, None)
374
408
                    return None
375
409
                else:
376
410
                    raise
377
 
        link_or_sha1 = dirstate.update_entry(state, entry, file_abspath,
378
 
            stat_value=stat_value)
 
411
        link_or_sha1 = state.update_entry(entry, file_abspath,
 
412
                                          stat_value=stat_value)
379
413
        if entry[1][0][0] == 'f':
380
 
            if link_or_sha1 is None:
381
 
                file_obj, statvalue = self.get_file_with_stat(file_id, path)
382
 
                try:
383
 
                    sha1 = osutils.sha_file(file_obj)
384
 
                finally:
385
 
                    file_obj.close()
386
 
                self._observed_sha1(file_id, path, (sha1, statvalue))
387
 
                return sha1
388
 
            else:
389
 
                return link_or_sha1
 
414
            return link_or_sha1
390
415
        return None
391
416
 
392
417
    def _get_inventory(self):
406
431
    @needs_read_lock
407
432
    def get_parent_ids(self):
408
433
        """See Tree.get_parent_ids.
409
 
 
 
434
        
410
435
        This implementation requests the ids list from the dirstate file.
411
436
        """
412
437
        return self.current_dirstate().get_parent_ids()
434
459
        return osutils.lexists(pathjoin(
435
460
                    self.basedir, row[0].decode('utf8'), row[1].decode('utf8')))
436
461
 
437
 
    def has_or_had_id(self, file_id):
438
 
        state = self.current_dirstate()
439
 
        row, parents = self._get_entry(file_id=file_id)
440
 
        return row is not None
441
 
 
442
462
    @needs_read_lock
443
463
    def id2path(self, file_id):
444
464
        "Convert a file-id to a path."
508
528
        return iter(result)
509
529
 
510
530
    def iter_references(self):
511
 
        if not self._repo_supports_tree_reference:
512
 
            # When the repo doesn't support references, we will have nothing to
513
 
            # return
514
 
            return
515
531
        for key, tree_details in self.current_dirstate()._iter_entries():
516
532
            if tree_details[0][0] in ('a', 'r'): # absent, relocated
517
533
                # not relevant to the working tree
519
535
            if not key[1]:
520
536
                # the root is not a reference.
521
537
                continue
522
 
            relpath = pathjoin(key[0].decode('utf8'), key[1].decode('utf8'))
 
538
            path = pathjoin(self.basedir, key[0].decode('utf8'), key[1].decode('utf8'))
523
539
            try:
524
 
                if self._kind(relpath) == 'tree-reference':
525
 
                    yield relpath, key[2]
 
540
                if self._kind(path) == 'tree-reference':
 
541
                    yield path, key[2]
526
542
            except errors.NoSuchFile:
527
543
                # path is missing on disk.
528
544
                continue
529
545
 
530
 
    def _observed_sha1(self, file_id, path, (sha1, statvalue)):
531
 
        """See MutableTree._observed_sha1."""
532
 
        state = self.current_dirstate()
533
 
        entry = self._get_entry(file_id=file_id, path=path)
534
 
        state._observed_sha1(entry, sha1, statvalue)
535
 
 
536
546
    def kind(self, file_id):
537
547
        """Return the kind of a file.
538
548
 
550
560
    def _kind(self, relpath):
551
561
        abspath = self.abspath(relpath)
552
562
        kind = file_kind(abspath)
553
 
        if (self._repo_supports_tree_reference and kind == 'directory'):
554
 
            entry = self._get_entry(path=relpath)
555
 
            if entry[1] is not None:
556
 
                if entry[1][0][0] == 't':
557
 
                    kind = 'tree-reference'
 
563
        if (self._repo_supports_tree_reference and
 
564
            kind == 'directory' and
 
565
            self._directory_is_tree_reference(relpath)):
 
566
            kind = 'tree-reference'
558
567
        return kind
559
568
 
560
569
    @needs_read_lock
567
576
            return _mod_revision.NULL_REVISION
568
577
 
569
578
    def lock_read(self):
570
 
        """See Branch.lock_read, and WorkingTree.unlock.
571
 
 
572
 
        :return: An object with an unlock method which will release the lock
573
 
            obtained.
574
 
        """
 
579
        """See Branch.lock_read, and WorkingTree.unlock."""
575
580
        self.branch.lock_read()
576
581
        try:
577
582
            self._control_files.lock_read()
590
595
        except:
591
596
            self.branch.unlock()
592
597
            raise
593
 
        return self
594
598
 
595
599
    def _lock_self_write(self):
596
600
        """This should be called after the branch is locked."""
611
615
        except:
612
616
            self.branch.unlock()
613
617
            raise
614
 
        return self
615
618
 
616
619
    def lock_tree_write(self):
617
 
        """See MutableTree.lock_tree_write, and WorkingTree.unlock.
618
 
 
619
 
        :return: An object with an unlock method which will release the lock
620
 
            obtained.
621
 
        """
 
620
        """See MutableTree.lock_tree_write, and WorkingTree.unlock."""
622
621
        self.branch.lock_read()
623
 
        return self._lock_self_write()
 
622
        self._lock_self_write()
624
623
 
625
624
    def lock_write(self):
626
 
        """See MutableTree.lock_write, and WorkingTree.unlock.
627
 
 
628
 
        :return: An object with an unlock method which will release the lock
629
 
            obtained.
630
 
        """
 
625
        """See MutableTree.lock_write, and WorkingTree.unlock."""
631
626
        self.branch.lock_write()
632
 
        return self._lock_self_write()
 
627
        self._lock_self_write()
633
628
 
634
629
    @needs_tree_write_lock
635
630
    def move(self, from_paths, to_dir, after=False):
705
700
            from_entry = self._get_entry(path=from_rel)
706
701
            if from_entry == (None, None):
707
702
                raise errors.BzrMoveFailedError(from_rel,to_dir,
708
 
                    errors.NotVersionedError(path=from_rel))
 
703
                    errors.NotVersionedError(path=str(from_rel)))
709
704
 
710
705
            from_id = from_entry[0][2]
711
706
            to_rel = pathjoin(to_dir, from_tail)
886
881
        for tree in trees:
887
882
            if not (isinstance(tree, DirStateRevisionTree) and tree._revision_id in
888
883
                parents):
889
 
                return super(DirStateWorkingTree, self).paths2ids(paths,
890
 
                    trees, require_versioned)
 
884
                return super(WorkingTree4, self).paths2ids(paths, trees, require_versioned)
891
885
        search_indexes = [0] + [1 + parents.index(tree._revision_id) for tree in trees]
892
886
        # -- make all paths utf8 --
893
887
        paths_utf8 = set()
954
948
                raise errors.PathsNotVersionedError(paths)
955
949
        # -- remove redundancy in supplied paths to prevent over-scanning --
956
950
        search_paths = osutils.minimum_path_selection(paths)
957
 
        # sketch:
 
951
        # sketch: 
958
952
        # for all search_indexes in each path at or under each element of
959
953
        # search_paths, if the detail is relocated: add the id, and add the
960
954
        # relocated path as one to search if it's not searched already. If the
1016
1010
 
1017
1011
    def read_working_inventory(self):
1018
1012
        """Read the working inventory.
1019
 
 
 
1013
        
1020
1014
        This is a meaningless operation for dirstate, but we obey it anyhow.
1021
1015
        """
1022
1016
        return self.inventory
1040
1034
    def set_last_revision(self, new_revision):
1041
1035
        """Change the last revision in the working tree."""
1042
1036
        parents = self.get_parent_ids()
1043
 
        if new_revision in (_mod_revision.NULL_REVISION, None):
 
1037
        if new_revision in (NULL_REVISION, None):
1044
1038
            if len(parents) >= 2:
1045
1039
                raise AssertionError(
1046
1040
                    "setting the last parent to none with a pending merge is "
1053
1047
    @needs_tree_write_lock
1054
1048
    def set_parent_ids(self, revision_ids, allow_leftmost_as_ghost=False):
1055
1049
        """Set the parent ids to revision_ids.
1056
 
 
 
1050
        
1057
1051
        See also set_parent_trees. This api will try to retrieve the tree data
1058
1052
        for each element of revision_ids from the trees repository. If you have
1059
1053
        tree data already available, it is more efficient to use
1111
1105
                real_trees.append((rev_id, tree))
1112
1106
            else:
1113
1107
                real_trees.append((rev_id,
1114
 
                    self.branch.repository.revision_tree(
1115
 
                        _mod_revision.NULL_REVISION)))
 
1108
                    self.branch.repository.revision_tree(None)))
1116
1109
                ghosts.append(rev_id)
1117
1110
            accepted_revisions.add(rev_id)
1118
1111
        dirstate.set_parent_trees(real_trees, ghosts=ghosts)
1213
1206
                # just forget the whole block.
1214
1207
                entry_index = 0
1215
1208
                while entry_index < len(block[1]):
 
1209
                    # Mark this file id as having been removed
1216
1210
                    entry = block[1][entry_index]
1217
 
                    if entry[1][0][0] in 'ar':
1218
 
                        # don't remove absent or renamed entries
 
1211
                    ids_to_unversion.discard(entry[0][2])
 
1212
                    if (entry[1][0][0] in 'ar' # don't remove absent or renamed
 
1213
                                               # entries
 
1214
                        or not state._make_absent(entry)):
1219
1215
                        entry_index += 1
1220
 
                    else:
1221
 
                        # Mark this file id as having been removed
1222
 
                        ids_to_unversion.discard(entry[0][2])
1223
 
                        if not state._make_absent(entry):
1224
 
                            # The block has not shrunk.
1225
 
                            entry_index += 1
1226
1216
                # go to the next block. (At the moment we don't delete empty
1227
1217
                # dirblocks)
1228
1218
                block_index += 1
1280
1270
        if self._dirty:
1281
1271
            raise AssertionError("attempting to write an inventory when the "
1282
1272
                "dirstate is dirty will lose pending changes")
1283
 
        had_inventory = self._inventory is not None
1284
 
        # Setting self._inventory = None forces the dirstate to regenerate the
1285
 
        # working inventory. We do this because self.inventory may be inv, or
1286
 
        # may have been modified, and either case would prevent a clean delta
1287
 
        # being created.
1288
 
        self._inventory = None
1289
 
        # generate a delta,
1290
 
        delta = inv._make_delta(self.inventory)
1291
 
        # and apply it.
1292
 
        self.apply_inventory_delta(delta)
1293
 
        if had_inventory:
 
1273
        self.current_dirstate().set_state_from_inventory(inv)
 
1274
        self._make_dirty(reset_inventory=False)
 
1275
        if self._inventory is not None:
1294
1276
            self._inventory = inv
1295
1277
        self.flush()
1296
1278
 
1297
1279
 
1298
 
class ContentFilterAwareSHA1Provider(dirstate.SHA1Provider):
1299
 
 
1300
 
    def __init__(self, tree):
1301
 
        self.tree = tree
1302
 
 
1303
 
    def sha1(self, abspath):
1304
 
        """See dirstate.SHA1Provider.sha1()."""
1305
 
        filters = self.tree._content_filter_stack(
1306
 
            self.tree.relpath(osutils.safe_unicode(abspath)))
1307
 
        return internal_size_sha_file_byname(abspath, filters)[1]
1308
 
 
1309
 
    def stat_and_sha1(self, abspath):
1310
 
        """See dirstate.SHA1Provider.stat_and_sha1()."""
1311
 
        filters = self.tree._content_filter_stack(
1312
 
            self.tree.relpath(osutils.safe_unicode(abspath)))
1313
 
        file_obj = file(abspath, 'rb', 65000)
1314
 
        try:
1315
 
            statvalue = os.fstat(file_obj.fileno())
1316
 
            if filters:
1317
 
                file_obj = filtered_input_file(file_obj, filters)
1318
 
            sha1 = osutils.size_sha_file(file_obj)[1]
1319
 
        finally:
1320
 
            file_obj.close()
1321
 
        return statvalue, sha1
1322
 
 
1323
 
 
1324
 
class ContentFilteringDirStateWorkingTree(DirStateWorkingTree):
1325
 
    """Dirstate working tree that supports content filtering.
1326
 
 
1327
 
    The dirstate holds the hash and size of the canonical form of the file, 
1328
 
    and most methods must return that.
1329
 
    """
1330
 
 
1331
 
    def _file_content_summary(self, path, stat_result):
1332
 
        # This is to support the somewhat obsolete path_content_summary method
1333
 
        # with content filtering: see
1334
 
        # <https://bugs.edge.launchpad.net/bzr/+bug/415508>.
1335
 
        #
1336
 
        # If the dirstate cache is up to date and knows the hash and size,
1337
 
        # return that.
1338
 
        # Otherwise if there are no content filters, return the on-disk size
1339
 
        # and leave the hash blank.
1340
 
        # Otherwise, read and filter the on-disk file and use its size and
1341
 
        # hash.
1342
 
        #
1343
 
        # The dirstate doesn't store the size of the canonical form so we
1344
 
        # can't trust it for content-filtered trees.  We just return None.
1345
 
        dirstate_sha1 = self._dirstate.sha1_from_stat(path, stat_result)
1346
 
        executable = self._is_executable_from_path_and_stat(path, stat_result)
1347
 
        return ('file', None, executable, dirstate_sha1)
1348
 
 
1349
 
 
1350
 
class WorkingTree4(DirStateWorkingTree):
1351
 
    """This is the Format 4 working tree.
1352
 
 
1353
 
    This differs from WorkingTree3 by:
1354
 
     - Having a consolidated internal dirstate, stored in a
1355
 
       randomly-accessible sorted file on disk.
1356
 
     - Not having a regular inventory attribute.  One can be synthesized
1357
 
       on demand but this is expensive and should be avoided.
1358
 
 
1359
 
    This is new in bzr 0.15.
1360
 
    """
1361
 
 
1362
 
 
1363
 
class WorkingTree5(ContentFilteringDirStateWorkingTree):
1364
 
    """This is the Format 5 working tree.
1365
 
 
1366
 
    This differs from WorkingTree4 by:
1367
 
     - Supporting content filtering.
1368
 
 
1369
 
    This is new in bzr 1.11.
1370
 
    """
1371
 
 
1372
 
 
1373
 
class WorkingTree6(ContentFilteringDirStateWorkingTree):
1374
 
    """This is the Format 6 working tree.
1375
 
 
1376
 
    This differs from WorkingTree5 by:
1377
 
     - Supporting a current view that may mask the set of files in a tree
1378
 
       impacted by most user operations.
1379
 
 
1380
 
    This is new in bzr 1.14.
1381
 
    """
1382
 
 
1383
 
    def _make_views(self):
1384
 
        return views.PathBasedViews(self)
1385
 
 
1386
 
 
1387
 
class DirStateWorkingTreeFormat(WorkingTreeFormat3):
 
1280
class WorkingTreeFormat4(WorkingTreeFormat3):
 
1281
    """The first consolidated dirstate working tree format.
 
1282
 
 
1283
    This format:
 
1284
        - exists within a metadir controlling .bzr
 
1285
        - includes an explicit version marker for the workingtree control
 
1286
          files, separate from the BzrDir format
 
1287
        - modifies the hash cache format
 
1288
        - is new in bzr 0.15
 
1289
        - uses a LockDir to guard access to it.
 
1290
    """
 
1291
 
 
1292
    upgrade_recommended = False
 
1293
 
 
1294
    def get_format_string(self):
 
1295
        """See WorkingTreeFormat.get_format_string()."""
 
1296
        return "Bazaar Working Tree Format 4 (bzr 0.15)\n"
 
1297
 
 
1298
    def get_format_description(self):
 
1299
        """See WorkingTreeFormat.get_format_description()."""
 
1300
        return "Working tree format 4"
1388
1301
 
1389
1302
    def initialize(self, a_bzrdir, revision_id=None, from_branch=None,
1390
1303
                   accelerator_tree=None, hardlink=False):
1421
1334
        state = dirstate.DirState.initialize(local_path)
1422
1335
        state.unlock()
1423
1336
        del state
1424
 
        wt = self._tree_class(a_bzrdir.root_transport.local_abspath('.'),
 
1337
        wt = WorkingTree4(a_bzrdir.root_transport.local_abspath('.'),
1425
1338
                         branch,
1426
1339
                         _format=self,
1427
1340
                         _bzrdir=a_bzrdir,
1429
1342
        wt._new_tree()
1430
1343
        wt.lock_tree_write()
1431
1344
        try:
1432
 
            self._init_custom_control_files(wt)
1433
 
            if revision_id in (None, _mod_revision.NULL_REVISION):
 
1345
            if revision_id in (None, NULL_REVISION):
1434
1346
                if branch.repository.supports_rich_root():
1435
1347
                    wt._set_root_id(generate_ids.gen_root_id())
1436
1348
                else:
1447
1359
                    pass
1448
1360
            if basis is None:
1449
1361
                basis = branch.repository.revision_tree(revision_id)
1450
 
            if revision_id == _mod_revision.NULL_REVISION:
 
1362
            if revision_id == NULL_REVISION:
1451
1363
                parents_list = []
1452
1364
            else:
1453
1365
                parents_list = [(revision_id, basis)]
1461
1373
                if basis_root_id is not None:
1462
1374
                    wt._set_root_id(basis_root_id)
1463
1375
                    wt.flush()
1464
 
                if wt.supports_content_filtering():
1465
 
                    # The original tree may not have the same content filters
1466
 
                    # applied so we can't safely build the inventory delta from
1467
 
                    # the source tree.
1468
 
                    delta_from_tree = False
1469
 
                else:
1470
 
                    delta_from_tree = True
1471
1376
                # delta_from_tree is safe even for DirStateRevisionTrees,
1472
1377
                # because wt4.apply_inventory_delta does not mutate the input
1473
1378
                # inventory entries.
1474
1379
                transform.build_tree(basis, wt, accelerator_tree,
1475
 
                                     hardlink=hardlink,
1476
 
                                     delta_from_tree=delta_from_tree)
 
1380
                                     hardlink=hardlink, delta_from_tree=True)
1477
1381
            finally:
1478
1382
                basis.unlock()
1479
1383
        finally:
1481
1385
            wt.unlock()
1482
1386
        return wt
1483
1387
 
1484
 
    def _init_custom_control_files(self, wt):
1485
 
        """Subclasses with custom control files should override this method.
1486
 
 
1487
 
        The working tree and control files are locked for writing when this
1488
 
        method is called.
1489
 
 
1490
 
        :param wt: the WorkingTree object
1491
 
        """
1492
 
 
1493
1388
    def _open(self, a_bzrdir, control_files):
1494
1389
        """Open the tree itself.
1495
1390
 
1496
1391
        :param a_bzrdir: the dir for the tree.
1497
1392
        :param control_files: the control files for the tree.
1498
1393
        """
1499
 
        return self._tree_class(a_bzrdir.root_transport.local_abspath('.'),
 
1394
        return WorkingTree4(a_bzrdir.root_transport.local_abspath('.'),
1500
1395
                           branch=a_bzrdir.open_branch(),
1501
1396
                           _format=self,
1502
1397
                           _bzrdir=a_bzrdir,
1503
1398
                           _control_files=control_files)
1504
1399
 
1505
1400
    def __get_matchingbzrdir(self):
1506
 
        return self._get_matchingbzrdir()
1507
 
 
1508
 
    def _get_matchingbzrdir(self):
1509
 
        """Overrideable method to get a bzrdir for testing."""
1510
1401
        # please test against something that will let us do tree references
1511
1402
        return bzrdir.format_registry.make_bzrdir(
1512
1403
            'dirstate-with-subtree')
1514
1405
    _matchingbzrdir = property(__get_matchingbzrdir)
1515
1406
 
1516
1407
 
1517
 
class WorkingTreeFormat4(DirStateWorkingTreeFormat):
1518
 
    """The first consolidated dirstate working tree format.
1519
 
 
1520
 
    This format:
1521
 
        - exists within a metadir controlling .bzr
1522
 
        - includes an explicit version marker for the workingtree control
1523
 
          files, separate from the BzrDir format
1524
 
        - modifies the hash cache format
1525
 
        - is new in bzr 0.15
1526
 
        - uses a LockDir to guard access to it.
1527
 
    """
1528
 
 
1529
 
    upgrade_recommended = False
1530
 
 
1531
 
    _tree_class = WorkingTree4
1532
 
 
1533
 
    def get_format_string(self):
1534
 
        """See WorkingTreeFormat.get_format_string()."""
1535
 
        return "Bazaar Working Tree Format 4 (bzr 0.15)\n"
1536
 
 
1537
 
    def get_format_description(self):
1538
 
        """See WorkingTreeFormat.get_format_description()."""
1539
 
        return "Working tree format 4"
1540
 
 
1541
 
 
1542
 
class WorkingTreeFormat5(DirStateWorkingTreeFormat):
1543
 
    """WorkingTree format supporting content filtering.
1544
 
    """
1545
 
 
1546
 
    upgrade_recommended = False
1547
 
 
1548
 
    _tree_class = WorkingTree5
1549
 
 
1550
 
    def get_format_string(self):
1551
 
        """See WorkingTreeFormat.get_format_string()."""
1552
 
        return "Bazaar Working Tree Format 5 (bzr 1.11)\n"
1553
 
 
1554
 
    def get_format_description(self):
1555
 
        """See WorkingTreeFormat.get_format_description()."""
1556
 
        return "Working tree format 5"
1557
 
 
1558
 
    def supports_content_filtering(self):
1559
 
        return True
1560
 
 
1561
 
 
1562
 
class WorkingTreeFormat6(DirStateWorkingTreeFormat):
1563
 
    """WorkingTree format supporting views.
1564
 
    """
1565
 
 
1566
 
    upgrade_recommended = False
1567
 
 
1568
 
    _tree_class = WorkingTree6
1569
 
 
1570
 
    def get_format_string(self):
1571
 
        """See WorkingTreeFormat.get_format_string()."""
1572
 
        return "Bazaar Working Tree Format 6 (bzr 1.14)\n"
1573
 
 
1574
 
    def get_format_description(self):
1575
 
        """See WorkingTreeFormat.get_format_description()."""
1576
 
        return "Working tree format 6"
1577
 
 
1578
 
    def _init_custom_control_files(self, wt):
1579
 
        """Subclasses with custom control files should override this method."""
1580
 
        wt._transport.put_bytes('views', '', mode=wt.bzrdir._get_file_mode())
1581
 
 
1582
 
    def supports_content_filtering(self):
1583
 
        return True
1584
 
 
1585
 
    def supports_views(self):
1586
 
        return True
1587
 
 
1588
 
 
1589
1408
class DirStateRevisionTree(Tree):
1590
 
    """A revision tree pulling the inventory from a dirstate.
1591
 
    
1592
 
    Note that this is one of the historical (ie revision) trees cached in the
1593
 
    dirstate for easy access, not the workingtree.
1594
 
    """
 
1409
    """A revision tree pulling the inventory from a dirstate."""
1595
1410
 
1596
1411
    def __init__(self, dirstate, revision_id, repository):
1597
1412
        self._dirstate = dirstate
1600
1415
        self._inventory = None
1601
1416
        self._locked = 0
1602
1417
        self._dirstate_locked = False
1603
 
        self._repo_supports_tree_reference = getattr(
1604
 
            repository._format, "supports_tree_reference",
1605
 
            False)
1606
1418
 
1607
1419
    def __repr__(self):
1608
1420
        return "<%s of %s in %s>" % \
1611
1423
    def annotate_iter(self, file_id,
1612
1424
                      default_revision=_mod_revision.CURRENT_REVISION):
1613
1425
        """See Tree.annotate_iter"""
1614
 
        text_key = (file_id, self.inventory[file_id].revision)
1615
 
        annotations = self._repository.texts.annotate(text_key)
1616
 
        return [(key[-1], line) for (key, line) in annotations]
 
1426
        w = self._get_weave(file_id)
 
1427
        return w.annotate(self.inventory[file_id].revision)
1617
1428
 
1618
1429
    def _get_ancestors(self, default_revision):
1619
1430
        return set(self._repository.get_ancestry(self._revision_id,
1648
1459
        path_utf8 = osutils.pathjoin(entry[0][0], entry[0][1])
1649
1460
        return path_utf8.decode('utf8')
1650
1461
 
1651
 
    def iter_references(self):
1652
 
        if not self._repo_supports_tree_reference:
1653
 
            # When the repo doesn't support references, we will have nothing to
1654
 
            # return
1655
 
            return iter([])
1656
 
        # Otherwise, fall back to the default implementation
1657
 
        return super(DirStateRevisionTree, self).iter_references()
1658
 
 
1659
1462
    def _get_parent_index(self):
1660
1463
        """Return the index in the dirstate referenced by this tree."""
1661
1464
        return self._dirstate.get_parent_ids().index(self._revision_id) + 1
1666
1469
        If either file_id or path is supplied, it is used as the key to lookup.
1667
1470
        If both are supplied, the fastest lookup is used, and an error is
1668
1471
        raised if they do not both point at the same row.
1669
 
 
 
1472
        
1670
1473
        :param file_id: An optional unicode file_id to be looked up.
1671
1474
        :param path: An optional unicode path to be looked up.
1672
1475
        :return: The dirstate row tuple for path/file_id, or (None, None)
1769
1572
            return None
1770
1573
        parent_index = self._get_parent_index()
1771
1574
        last_changed_revision = entry[1][parent_index][4]
1772
 
        try:
1773
 
            rev = self._repository.get_revision(last_changed_revision)
1774
 
        except errors.NoSuchRevision:
1775
 
            raise errors.FileTimestampUnavailable(self.id2path(file_id))
1776
 
        return rev.timestamp
 
1575
        return self._repository.get_revision(last_changed_revision).timestamp
1777
1576
 
1778
1577
    def get_file_sha1(self, file_id, path=None, stat_value=None):
1779
1578
        entry = self._get_entry(file_id=file_id, path=path)
1783
1582
            return parent_details[1]
1784
1583
        return None
1785
1584
 
 
1585
    def _get_weave(self, file_id):
 
1586
        return self._repository.weave_store.get_weave(file_id,
 
1587
                self._repository.get_transaction())
 
1588
 
1786
1589
    def get_file(self, file_id, path=None):
1787
1590
        return StringIO(self.get_file_text(file_id))
1788
1591
 
 
1592
    def get_file_lines(self, file_id):
 
1593
        entry = self._get_entry(file_id=file_id)[1]
 
1594
        if entry is None:
 
1595
            raise errors.NoSuchId(tree=self, file_id=file_id)
 
1596
        return self._get_weave(file_id).get_lines(entry[1][4])
 
1597
 
1789
1598
    def get_file_size(self, file_id):
1790
1599
        """See Tree.get_file_size"""
1791
1600
        return self.inventory[file_id].text_size
1792
1601
 
1793
 
    def get_file_text(self, file_id, path=None):
1794
 
        _, content = list(self.iter_files_bytes([(file_id, None)]))[0]
1795
 
        return ''.join(content)
 
1602
    def get_file_text(self, file_id):
 
1603
        return ''.join(self.get_file_lines(file_id))
1796
1604
 
1797
1605
    def get_reference_revision(self, file_id, path=None):
1798
1606
        return self.inventory[file_id].reference_revision
1817
1625
        if entry[1][parent_index][0] != 'l':
1818
1626
            return None
1819
1627
        else:
1820
 
            target = entry[1][parent_index][1]
1821
 
            target = target.decode('utf8')
1822
 
            return target
 
1628
            # At present, none of the tree implementations supports non-ascii
 
1629
            # symlink targets. So we will just assume that the dirstate path is
 
1630
            # correct.
 
1631
            return entry[1][parent_index][1]
1823
1632
 
1824
1633
    def get_revision_id(self):
1825
1634
        """Return the revision id for this tree."""
1846
1655
        entry = self._get_entry(file_id=file_id)[1]
1847
1656
        if entry is None:
1848
1657
            raise errors.NoSuchId(tree=self, file_id=file_id)
1849
 
        parent_index = self._get_parent_index()
1850
 
        return dirstate.DirState._minikind_to_kind[entry[parent_index][0]]
 
1658
        return dirstate.DirState._minikind_to_kind[entry[1][0]]
1851
1659
 
1852
1660
    def stored_kind(self, file_id):
1853
1661
        """See Tree.stored_kind"""
1873
1681
            return None
1874
1682
        return ie.executable
1875
1683
 
1876
 
    def is_locked(self):
1877
 
        return self._locked
1878
 
 
1879
 
    def list_files(self, include_root=False, from_dir=None, recursive=True):
 
1684
    def list_files(self, include_root=False):
1880
1685
        # We use a standard implementation, because DirStateRevisionTree is
1881
1686
        # dealing with one of the parents of the current state
1882
1687
        inv = self._get_inventory()
1883
 
        if from_dir is None:
1884
 
            from_dir_id = None
1885
 
        else:
1886
 
            from_dir_id = inv.path2id(from_dir)
1887
 
            if from_dir_id is None:
1888
 
                # Directory not versioned
1889
 
                return
1890
 
        entries = inv.iter_entries(from_dir=from_dir_id, recursive=recursive)
1891
 
        if inv.root is not None and not include_root and from_dir is None:
 
1688
        entries = inv.iter_entries()
 
1689
        if self.inventory.root is not None and not include_root:
1892
1690
            entries.next()
1893
1691
        for path, entry in entries:
1894
1692
            yield path, 'V', entry.kind, entry.file_id, entry
1895
1693
 
1896
1694
    def lock_read(self):
1897
 
        """Lock the tree for a set of operations.
1898
 
 
1899
 
        :return: An object with an unlock method which will release the lock
1900
 
            obtained.
1901
 
        """
 
1695
        """Lock the tree for a set of operations."""
1902
1696
        if not self._locked:
1903
1697
            self._repository.lock_read()
1904
1698
            if self._dirstate._lock_token is None:
1905
1699
                self._dirstate.lock_read()
1906
1700
                self._dirstate_locked = True
1907
1701
        self._locked += 1
1908
 
        return self
1909
1702
 
1910
1703
    def _must_be_locked(self):
1911
1704
        if not self._locked:
1932
1725
                self._dirstate_locked = False
1933
1726
            self._repository.unlock()
1934
1727
 
1935
 
    @needs_read_lock
1936
 
    def supports_tree_reference(self):
1937
 
        return self._repo_supports_tree_reference
1938
 
 
1939
1728
    def walkdirs(self, prefix=""):
1940
1729
        # TODO: jam 20070215 This is the lazy way by using the RevisionTree
1941
 
        # implementation based on an inventory.
 
1730
        # implementation based on an inventory.  
1942
1731
        # This should be cleaned up to use the much faster Dirstate code
1943
1732
        # So for now, we just build up the parent inventory, and extract
1944
1733
        # it the same way RevisionTree does.
1973
1762
 
1974
1763
class InterDirStateTree(InterTree):
1975
1764
    """Fast path optimiser for changes_from with dirstate trees.
1976
 
 
1977
 
    This is used only when both trees are in the dirstate working file, and
1978
 
    the source is any parent within the dirstate, and the destination is
 
1765
    
 
1766
    This is used only when both trees are in the dirstate working file, and 
 
1767
    the source is any parent within the dirstate, and the destination is 
1979
1768
    the current working tree of the same dirstate.
1980
1769
    """
1981
1770
    # this could be generalized to allow comparisons between any trees in the
1994
1783
        target.set_parent_ids([revid])
1995
1784
        return target.basis_tree(), target
1996
1785
 
1997
 
    @classmethod
1998
 
    def make_source_parent_tree_python_dirstate(klass, test_case, source, target):
1999
 
        result = klass.make_source_parent_tree(source, target)
2000
 
        result[1]._iter_changes = dirstate.ProcessEntryPython
2001
 
        return result
2002
 
 
2003
 
    @classmethod
2004
 
    def make_source_parent_tree_compiled_dirstate(klass, test_case, source,
2005
 
                                                  target):
2006
 
        from bzrlib.tests.test__dirstate_helpers import \
2007
 
            compiled_dirstate_helpers_feature
2008
 
        test_case.requireFeature(compiled_dirstate_helpers_feature)
2009
 
        from bzrlib._dirstate_helpers_pyx import ProcessEntryC
2010
 
        result = klass.make_source_parent_tree(source, target)
2011
 
        result[1]._iter_changes = ProcessEntryC
2012
 
        return result
2013
 
 
2014
1786
    _matching_from_tree_format = WorkingTreeFormat4()
2015
1787
    _matching_to_tree_format = WorkingTreeFormat4()
2016
 
 
2017
 
    @classmethod
2018
 
    def _test_mutable_trees_to_test_trees(klass, test_case, source, target):
2019
 
        # This method shouldn't be called, because we have python and C
2020
 
        # specific flavours.
2021
 
        raise NotImplementedError
 
1788
    _test_mutable_trees_to_test_trees = make_source_parent_tree
2022
1789
 
2023
1790
    def iter_changes(self, include_unchanged=False,
2024
1791
                      specific_files=None, pb=None, extra_trees=[],
2042
1809
            output. An unversioned file is defined as one with (False, False)
2043
1810
            for the versioned pair.
2044
1811
        """
 
1812
        utf8_decode = cache_utf8._utf8_decode
 
1813
        _minikind_to_kind = dirstate.DirState._minikind_to_kind
 
1814
        cmp_by_dirs = dirstate.cmp_by_dirs
 
1815
        # NB: show_status depends on being able to pass in non-versioned files
 
1816
        # and report them as unknown
2045
1817
        # TODO: handle extra trees in the dirstate.
2046
1818
        if (extra_trees or specific_files == []):
2047
1819
            # we can't fast-path these cases (yet)
2048
 
            return super(InterDirStateTree, self).iter_changes(
 
1820
            for f in super(InterDirStateTree, self).iter_changes(
2049
1821
                include_unchanged, specific_files, pb, extra_trees,
2050
 
                require_versioned, want_unversioned=want_unversioned)
 
1822
                require_versioned, want_unversioned=want_unversioned):
 
1823
                yield f
 
1824
            return
2051
1825
        parent_ids = self.target.get_parent_ids()
2052
1826
        if not (self.source._revision_id in parent_ids
2053
 
                or self.source._revision_id == _mod_revision.NULL_REVISION):
 
1827
                or self.source._revision_id == NULL_REVISION):
2054
1828
            raise AssertionError(
2055
1829
                "revision {%s} is not stored in {%s}, but %s "
2056
1830
                "can only be used for trees stored in the dirstate"
2057
1831
                % (self.source._revision_id, self.target, self.iter_changes))
2058
1832
        target_index = 0
2059
 
        if self.source._revision_id == _mod_revision.NULL_REVISION:
 
1833
        if self.source._revision_id == NULL_REVISION:
2060
1834
            source_index = None
2061
1835
            indices = (target_index,)
2062
1836
        else:
2070
1844
        if specific_files:
2071
1845
            specific_files_utf8 = set()
2072
1846
            for path in specific_files:
2073
 
                # Note, if there are many specific files, using cache_utf8
2074
 
                # would be good here.
2075
1847
                specific_files_utf8.add(path.encode('utf8'))
2076
1848
            specific_files = specific_files_utf8
2077
1849
        else:
2078
1850
            specific_files = set([''])
2079
1851
        # -- specific_files is now a utf8 path set --
2080
 
 
2081
1852
        # -- get the state object and prepare it.
2082
1853
        state = self.target.current_dirstate()
2083
1854
        state._read_dirblocks_if_needed()
 
1855
        def _entries_for_path(path):
 
1856
            """Return a list with all the entries that match path for all ids.
 
1857
            """
 
1858
            dirname, basename = os.path.split(path)
 
1859
            key = (dirname, basename, '')
 
1860
            block_index, present = state._find_block_index_from_key(key)
 
1861
            if not present:
 
1862
                # the block which should contain path is absent.
 
1863
                return []
 
1864
            result = []
 
1865
            block = state._dirblocks[block_index][1]
 
1866
            entry_index, _ = state._find_entry_index(key, block)
 
1867
            # we may need to look at multiple entries at this path: walk while the specific_files match.
 
1868
            while (entry_index < len(block) and
 
1869
                block[entry_index][0][0:2] == key[0:2]):
 
1870
                result.append(block[entry_index])
 
1871
                entry_index += 1
 
1872
            return result
2084
1873
        if require_versioned:
2085
1874
            # -- check all supplied paths are versioned in a search tree. --
2086
 
            not_versioned = []
 
1875
            all_versioned = True
2087
1876
            for path in specific_files:
2088
 
                path_entries = state._entries_for_path(path)
 
1877
                path_entries = _entries_for_path(path)
2089
1878
                if not path_entries:
2090
1879
                    # this specified path is not present at all: error
2091
 
                    not_versioned.append(path)
2092
 
                    continue
 
1880
                    all_versioned = False
 
1881
                    break
2093
1882
                found_versioned = False
2094
1883
                # for each id at this path
2095
1884
                for entry in path_entries:
2102
1891
                if not found_versioned:
2103
1892
                    # none of the indexes was not 'absent' at all ids for this
2104
1893
                    # path.
2105
 
                    not_versioned.append(path)
2106
 
            if len(not_versioned) > 0:
2107
 
                raise errors.PathsNotVersionedError(not_versioned)
 
1894
                    all_versioned = False
 
1895
                    break
 
1896
            if not all_versioned:
 
1897
                raise errors.PathsNotVersionedError(specific_files)
2108
1898
        # -- remove redundancy in supplied specific_files to prevent over-scanning --
2109
 
        search_specific_files = osutils.minimum_path_selection(specific_files)
 
1899
        search_specific_files = set()
 
1900
        for path in specific_files:
 
1901
            other_specific_files = specific_files.difference(set([path]))
 
1902
            if not osutils.is_inside_any(other_specific_files, path):
 
1903
                # this is a top level path, we must check it.
 
1904
                search_specific_files.add(path)
 
1905
        # sketch: 
 
1906
        # compare source_index and target_index at or under each element of search_specific_files.
 
1907
        # follow the following comparison table. Note that we only want to do diff operations when
 
1908
        # the target is fdl because thats when the walkdirs logic will have exposed the pathinfo 
 
1909
        # for the target.
 
1910
        # cases:
 
1911
        # 
 
1912
        # Source | Target | disk | action
 
1913
        #   r    | fdlt   |      | add source to search, add id path move and perform
 
1914
        #        |        |      | diff check on source-target
 
1915
        #   r    | fdlt   |  a   | dangling file that was present in the basis. 
 
1916
        #        |        |      | ???
 
1917
        #   r    |  a     |      | add source to search
 
1918
        #   r    |  a     |  a   | 
 
1919
        #   r    |  r     |      | this path is present in a non-examined tree, skip.
 
1920
        #   r    |  r     |  a   | this path is present in a non-examined tree, skip.
 
1921
        #   a    | fdlt   |      | add new id
 
1922
        #   a    | fdlt   |  a   | dangling locally added file, skip
 
1923
        #   a    |  a     |      | not present in either tree, skip
 
1924
        #   a    |  a     |  a   | not present in any tree, skip
 
1925
        #   a    |  r     |      | not present in either tree at this path, skip as it
 
1926
        #        |        |      | may not be selected by the users list of paths.
 
1927
        #   a    |  r     |  a   | not present in either tree at this path, skip as it
 
1928
        #        |        |      | may not be selected by the users list of paths.
 
1929
        #  fdlt  | fdlt   |      | content in both: diff them
 
1930
        #  fdlt  | fdlt   |  a   | deleted locally, but not unversioned - show as deleted ?
 
1931
        #  fdlt  |  a     |      | unversioned: output deleted id for now
 
1932
        #  fdlt  |  a     |  a   | unversioned and deleted: output deleted id
 
1933
        #  fdlt  |  r     |      | relocated in this tree, so add target to search.
 
1934
        #        |        |      | Dont diff, we will see an r,fd; pair when we reach
 
1935
        #        |        |      | this id at the other path.
 
1936
        #  fdlt  |  r     |  a   | relocated in this tree, so add target to search.
 
1937
        #        |        |      | Dont diff, we will see an r,fd; pair when we reach
 
1938
        #        |        |      | this id at the other path.
 
1939
 
 
1940
        # for all search_indexs in each path at or under each element of
 
1941
        # search_specific_files, if the detail is relocated: add the id, and add the
 
1942
        # relocated path as one to search if its not searched already. If the
 
1943
        # detail is not relocated, add the id.
 
1944
        searched_specific_files = set()
 
1945
        NULL_PARENT_DETAILS = dirstate.DirState.NULL_PARENT_DETAILS
 
1946
        # Using a list so that we can access the values and change them in
 
1947
        # nested scope. Each one is [path, file_id, entry]
 
1948
        last_source_parent = [None, None]
 
1949
        last_target_parent = [None, None]
2110
1950
 
2111
1951
        use_filesystem_for_exec = (sys.platform != 'win32')
2112
 
        iter_changes = self.target._iter_changes(include_unchanged,
2113
 
            use_filesystem_for_exec, search_specific_files, state,
2114
 
            source_index, target_index, want_unversioned, self.target)
2115
 
        return iter_changes.iter_changes()
 
1952
 
 
1953
        # Just a sentry, so that _process_entry can say that this
 
1954
        # record is handled, but isn't interesting to process (unchanged)
 
1955
        uninteresting = object()
 
1956
 
 
1957
 
 
1958
        old_dirname_to_file_id = {}
 
1959
        new_dirname_to_file_id = {}
 
1960
        # TODO: jam 20070516 - Avoid the _get_entry lookup overhead by
 
1961
        #       keeping a cache of directories that we have seen.
 
1962
 
 
1963
        def _process_entry(entry, path_info):
 
1964
            """Compare an entry and real disk to generate delta information.
 
1965
 
 
1966
            :param path_info: top_relpath, basename, kind, lstat, abspath for
 
1967
                the path of entry. If None, then the path is considered absent.
 
1968
                (Perhaps we should pass in a concrete entry for this ?)
 
1969
                Basename is returned as a utf8 string because we expect this
 
1970
                tuple will be ignored, and don't want to take the time to
 
1971
                decode.
 
1972
            :return: None if these don't match
 
1973
                     A tuple of information about the change, or
 
1974
                     the object 'uninteresting' if these match, but are
 
1975
                     basically identical.
 
1976
            """
 
1977
            if source_index is None:
 
1978
                source_details = NULL_PARENT_DETAILS
 
1979
            else:
 
1980
                source_details = entry[1][source_index]
 
1981
            target_details = entry[1][target_index]
 
1982
            target_minikind = target_details[0]
 
1983
            if path_info is not None and target_minikind in 'fdlt':
 
1984
                if not (target_index == 0):
 
1985
                    raise AssertionError()
 
1986
                link_or_sha1 = state.update_entry(entry, abspath=path_info[4],
 
1987
                                                  stat_value=path_info[3])
 
1988
                # The entry may have been modified by update_entry
 
1989
                target_details = entry[1][target_index]
 
1990
                target_minikind = target_details[0]
 
1991
            else:
 
1992
                link_or_sha1 = None
 
1993
            file_id = entry[0][2]
 
1994
            source_minikind = source_details[0]
 
1995
            if source_minikind in 'fdltr' and target_minikind in 'fdlt':
 
1996
                # claimed content in both: diff
 
1997
                #   r    | fdlt   |      | add source to search, add id path move and perform
 
1998
                #        |        |      | diff check on source-target
 
1999
                #   r    | fdlt   |  a   | dangling file that was present in the basis.
 
2000
                #        |        |      | ???
 
2001
                if source_minikind in 'r':
 
2002
                    # add the source to the search path to find any children it
 
2003
                    # has.  TODO ? : only add if it is a container ?
 
2004
                    if not osutils.is_inside_any(searched_specific_files,
 
2005
                                                 source_details[1]):
 
2006
                        search_specific_files.add(source_details[1])
 
2007
                    # generate the old path; this is needed for stating later
 
2008
                    # as well.
 
2009
                    old_path = source_details[1]
 
2010
                    old_dirname, old_basename = os.path.split(old_path)
 
2011
                    path = pathjoin(entry[0][0], entry[0][1])
 
2012
                    old_entry = state._get_entry(source_index,
 
2013
                                                 path_utf8=old_path)
 
2014
                    # update the source details variable to be the real
 
2015
                    # location.
 
2016
                    if old_entry == (None, None):
 
2017
                        raise errors.CorruptDirstate(state._filename,
 
2018
                            "entry '%s/%s' is considered renamed from %r"
 
2019
                            " but source does not exist\n"
 
2020
                            "entry: %s" % (entry[0][0], entry[0][1], old_path, entry))
 
2021
                    source_details = old_entry[1][source_index]
 
2022
                    source_minikind = source_details[0]
 
2023
                else:
 
2024
                    old_dirname = entry[0][0]
 
2025
                    old_basename = entry[0][1]
 
2026
                    old_path = path = None
 
2027
                if path_info is None:
 
2028
                    # the file is missing on disk, show as removed.
 
2029
                    content_change = True
 
2030
                    target_kind = None
 
2031
                    target_exec = False
 
2032
                else:
 
2033
                    # source and target are both versioned and disk file is present.
 
2034
                    target_kind = path_info[2]
 
2035
                    if target_kind == 'directory':
 
2036
                        if path is None:
 
2037
                            old_path = path = pathjoin(old_dirname, old_basename)
 
2038
                        new_dirname_to_file_id[path] = file_id
 
2039
                        if source_minikind != 'd':
 
2040
                            content_change = True
 
2041
                        else:
 
2042
                            # directories have no fingerprint
 
2043
                            content_change = False
 
2044
                        target_exec = False
 
2045
                    elif target_kind == 'file':
 
2046
                        if source_minikind != 'f':
 
2047
                            content_change = True
 
2048
                        else:
 
2049
                            # We could check the size, but we already have the
 
2050
                            # sha1 hash.
 
2051
                            content_change = (link_or_sha1 != source_details[1])
 
2052
                        # Target details is updated at update_entry time
 
2053
                        if use_filesystem_for_exec:
 
2054
                            # We don't need S_ISREG here, because we are sure
 
2055
                            # we are dealing with a file.
 
2056
                            target_exec = bool(stat.S_IEXEC & path_info[3].st_mode)
 
2057
                        else:
 
2058
                            target_exec = target_details[3]
 
2059
                    elif target_kind == 'symlink':
 
2060
                        if source_minikind != 'l':
 
2061
                            content_change = True
 
2062
                        else:
 
2063
                            content_change = (link_or_sha1 != source_details[1])
 
2064
                        target_exec = False
 
2065
                    elif target_kind == 'tree-reference':
 
2066
                        if source_minikind != 't':
 
2067
                            content_change = True
 
2068
                        else:
 
2069
                            content_change = False
 
2070
                        target_exec = False
 
2071
                    else:
 
2072
                        raise Exception, "unknown kind %s" % path_info[2]
 
2073
                if source_minikind == 'd':
 
2074
                    if path is None:
 
2075
                        old_path = path = pathjoin(old_dirname, old_basename)
 
2076
                    old_dirname_to_file_id[old_path] = file_id
 
2077
                # parent id is the entry for the path in the target tree
 
2078
                if old_dirname == last_source_parent[0]:
 
2079
                    source_parent_id = last_source_parent[1]
 
2080
                else:
 
2081
                    try:
 
2082
                        source_parent_id = old_dirname_to_file_id[old_dirname]
 
2083
                    except KeyError:
 
2084
                        source_parent_entry = state._get_entry(source_index,
 
2085
                                                               path_utf8=old_dirname)
 
2086
                        source_parent_id = source_parent_entry[0][2]
 
2087
                    if source_parent_id == entry[0][2]:
 
2088
                        # This is the root, so the parent is None
 
2089
                        source_parent_id = None
 
2090
                    else:
 
2091
                        last_source_parent[0] = old_dirname
 
2092
                        last_source_parent[1] = source_parent_id
 
2093
                new_dirname = entry[0][0]
 
2094
                if new_dirname == last_target_parent[0]:
 
2095
                    target_parent_id = last_target_parent[1]
 
2096
                else:
 
2097
                    try:
 
2098
                        target_parent_id = new_dirname_to_file_id[new_dirname]
 
2099
                    except KeyError:
 
2100
                        # TODO: We don't always need to do the lookup, because the
 
2101
                        #       parent entry will be the same as the source entry.
 
2102
                        target_parent_entry = state._get_entry(target_index,
 
2103
                                                               path_utf8=new_dirname)
 
2104
                        if target_parent_entry == (None, None):
 
2105
                            raise AssertionError(
 
2106
                                "Could not find target parent in wt: %s\nparent of: %s"
 
2107
                                % (new_dirname, entry))
 
2108
                        target_parent_id = target_parent_entry[0][2]
 
2109
                    if target_parent_id == entry[0][2]:
 
2110
                        # This is the root, so the parent is None
 
2111
                        target_parent_id = None
 
2112
                    else:
 
2113
                        last_target_parent[0] = new_dirname
 
2114
                        last_target_parent[1] = target_parent_id
 
2115
 
 
2116
                source_exec = source_details[3]
 
2117
                if (include_unchanged
 
2118
                    or content_change
 
2119
                    or source_parent_id != target_parent_id
 
2120
                    or old_basename != entry[0][1]
 
2121
                    or source_exec != target_exec
 
2122
                    ):
 
2123
                    if old_path is None:
 
2124
                        old_path = path = pathjoin(old_dirname, old_basename)
 
2125
                        old_path_u = utf8_decode(old_path)[0]
 
2126
                        path_u = old_path_u
 
2127
                    else:
 
2128
                        old_path_u = utf8_decode(old_path)[0]
 
2129
                        if old_path == path:
 
2130
                            path_u = old_path_u
 
2131
                        else:
 
2132
                            path_u = utf8_decode(path)[0]
 
2133
                    source_kind = _minikind_to_kind[source_minikind]
 
2134
                    return (entry[0][2],
 
2135
                           (old_path_u, path_u),
 
2136
                           content_change,
 
2137
                           (True, True),
 
2138
                           (source_parent_id, target_parent_id),
 
2139
                           (utf8_decode(old_basename)[0], utf8_decode(entry[0][1])[0]),
 
2140
                           (source_kind, target_kind),
 
2141
                           (source_exec, target_exec))
 
2142
                else:
 
2143
                    return uninteresting
 
2144
            elif source_minikind in 'a' and target_minikind in 'fdlt':
 
2145
                # looks like a new file
 
2146
                if path_info is not None:
 
2147
                    path = pathjoin(entry[0][0], entry[0][1])
 
2148
                    # parent id is the entry for the path in the target tree
 
2149
                    # TODO: these are the same for an entire directory: cache em.
 
2150
                    parent_id = state._get_entry(target_index,
 
2151
                                                 path_utf8=entry[0][0])[0][2]
 
2152
                    if parent_id == entry[0][2]:
 
2153
                        parent_id = None
 
2154
                    if use_filesystem_for_exec:
 
2155
                        # We need S_ISREG here, because we aren't sure if this
 
2156
                        # is a file or not.
 
2157
                        target_exec = bool(
 
2158
                            stat.S_ISREG(path_info[3].st_mode)
 
2159
                            and stat.S_IEXEC & path_info[3].st_mode)
 
2160
                    else:
 
2161
                        target_exec = target_details[3]
 
2162
                    return (entry[0][2],
 
2163
                           (None, utf8_decode(path)[0]),
 
2164
                           True,
 
2165
                           (False, True),
 
2166
                           (None, parent_id),
 
2167
                           (None, utf8_decode(entry[0][1])[0]),
 
2168
                           (None, path_info[2]),
 
2169
                           (None, target_exec))
 
2170
                else:
 
2171
                    # but its not on disk: we deliberately treat this as just
 
2172
                    # never-present. (Why ?! - RBC 20070224)
 
2173
                    pass
 
2174
            elif source_minikind in 'fdlt' and target_minikind in 'a':
 
2175
                # unversioned, possibly, or possibly not deleted: we dont care.
 
2176
                # if its still on disk, *and* theres no other entry at this
 
2177
                # path [we dont know this in this routine at the moment -
 
2178
                # perhaps we should change this - then it would be an unknown.
 
2179
                old_path = pathjoin(entry[0][0], entry[0][1])
 
2180
                # parent id is the entry for the path in the target tree
 
2181
                parent_id = state._get_entry(source_index, path_utf8=entry[0][0])[0][2]
 
2182
                if parent_id == entry[0][2]:
 
2183
                    parent_id = None
 
2184
                return (entry[0][2],
 
2185
                       (utf8_decode(old_path)[0], None),
 
2186
                       True,
 
2187
                       (True, False),
 
2188
                       (parent_id, None),
 
2189
                       (utf8_decode(entry[0][1])[0], None),
 
2190
                       (_minikind_to_kind[source_minikind], None),
 
2191
                       (source_details[3], None))
 
2192
            elif source_minikind in 'fdlt' and target_minikind in 'r':
 
2193
                # a rename; could be a true rename, or a rename inherited from
 
2194
                # a renamed parent. TODO: handle this efficiently. Its not
 
2195
                # common case to rename dirs though, so a correct but slow
 
2196
                # implementation will do.
 
2197
                if not osutils.is_inside_any(searched_specific_files, target_details[1]):
 
2198
                    search_specific_files.add(target_details[1])
 
2199
            elif source_minikind in 'ra' and target_minikind in 'ra':
 
2200
                # neither of the selected trees contain this file,
 
2201
                # so skip over it. This is not currently directly tested, but
 
2202
                # is indirectly via test_too_much.TestCommands.test_conflicts.
 
2203
                pass
 
2204
            else:
 
2205
                raise AssertionError("don't know how to compare "
 
2206
                    "source_minikind=%r, target_minikind=%r"
 
2207
                    % (source_minikind, target_minikind))
 
2208
                ## import pdb;pdb.set_trace()
 
2209
            return None
 
2210
 
 
2211
        while search_specific_files:
 
2212
            # TODO: the pending list should be lexically sorted?  the
 
2213
            # interface doesn't require it.
 
2214
            current_root = search_specific_files.pop()
 
2215
            current_root_unicode = current_root.decode('utf8')
 
2216
            searched_specific_files.add(current_root)
 
2217
            # process the entries for this containing directory: the rest will be
 
2218
            # found by their parents recursively.
 
2219
            root_entries = _entries_for_path(current_root)
 
2220
            root_abspath = self.target.abspath(current_root_unicode)
 
2221
            try:
 
2222
                root_stat = os.lstat(root_abspath)
 
2223
            except OSError, e:
 
2224
                if e.errno == errno.ENOENT:
 
2225
                    # the path does not exist: let _process_entry know that.
 
2226
                    root_dir_info = None
 
2227
                else:
 
2228
                    # some other random error: hand it up.
 
2229
                    raise
 
2230
            else:
 
2231
                root_dir_info = ('', current_root,
 
2232
                    osutils.file_kind_from_stat_mode(root_stat.st_mode), root_stat,
 
2233
                    root_abspath)
 
2234
                if root_dir_info[2] == 'directory':
 
2235
                    if self.target._directory_is_tree_reference(
 
2236
                        current_root.decode('utf8')):
 
2237
                        root_dir_info = root_dir_info[:2] + \
 
2238
                            ('tree-reference',) + root_dir_info[3:]
 
2239
 
 
2240
            if not root_entries and not root_dir_info:
 
2241
                # this specified path is not present at all, skip it.
 
2242
                continue
 
2243
            path_handled = False
 
2244
            for entry in root_entries:
 
2245
                result = _process_entry(entry, root_dir_info)
 
2246
                if result is not None:
 
2247
                    path_handled = True
 
2248
                    if result is not uninteresting:
 
2249
                        yield result
 
2250
            if want_unversioned and not path_handled and root_dir_info:
 
2251
                new_executable = bool(
 
2252
                    stat.S_ISREG(root_dir_info[3].st_mode)
 
2253
                    and stat.S_IEXEC & root_dir_info[3].st_mode)
 
2254
                yield (None,
 
2255
                       (None, current_root_unicode),
 
2256
                       True,
 
2257
                       (False, False),
 
2258
                       (None, None),
 
2259
                       (None, splitpath(current_root_unicode)[-1]),
 
2260
                       (None, root_dir_info[2]),
 
2261
                       (None, new_executable)
 
2262
                      )
 
2263
            initial_key = (current_root, '', '')
 
2264
            block_index, _ = state._find_block_index_from_key(initial_key)
 
2265
            if block_index == 0:
 
2266
                # we have processed the total root already, but because the
 
2267
                # initial key matched it we should skip it here.
 
2268
                block_index +=1
 
2269
            if root_dir_info and root_dir_info[2] == 'tree-reference':
 
2270
                current_dir_info = None
 
2271
            else:
 
2272
                dir_iterator = osutils._walkdirs_utf8(root_abspath, prefix=current_root)
 
2273
                try:
 
2274
                    current_dir_info = dir_iterator.next()
 
2275
                except OSError, e:
 
2276
                    # on win32, python2.4 has e.errno == ERROR_DIRECTORY, but
 
2277
                    # python 2.5 has e.errno == EINVAL,
 
2278
                    #            and e.winerror == ERROR_DIRECTORY
 
2279
                    e_winerror = getattr(e, 'winerror', None)
 
2280
                    win_errors = (ERROR_DIRECTORY, ERROR_PATH_NOT_FOUND)
 
2281
                    # there may be directories in the inventory even though
 
2282
                    # this path is not a file on disk: so mark it as end of
 
2283
                    # iterator
 
2284
                    if e.errno in (errno.ENOENT, errno.ENOTDIR, errno.EINVAL):
 
2285
                        current_dir_info = None
 
2286
                    elif (sys.platform == 'win32'
 
2287
                          and (e.errno in win_errors
 
2288
                               or e_winerror in win_errors)):
 
2289
                        current_dir_info = None
 
2290
                    else:
 
2291
                        raise
 
2292
                else:
 
2293
                    if current_dir_info[0][0] == '':
 
2294
                        # remove .bzr from iteration
 
2295
                        bzr_index = bisect_left(current_dir_info[1], ('.bzr',))
 
2296
                        if current_dir_info[1][bzr_index][0] != '.bzr':
 
2297
                            raise AssertionError()
 
2298
                        del current_dir_info[1][bzr_index]
 
2299
            # walk until both the directory listing and the versioned metadata
 
2300
            # are exhausted. 
 
2301
            if (block_index < len(state._dirblocks) and
 
2302
                osutils.is_inside(current_root, state._dirblocks[block_index][0])):
 
2303
                current_block = state._dirblocks[block_index]
 
2304
            else:
 
2305
                current_block = None
 
2306
            while (current_dir_info is not None or
 
2307
                   current_block is not None):
 
2308
                if (current_dir_info and current_block
 
2309
                    and current_dir_info[0][0] != current_block[0]):
 
2310
                    if cmp_by_dirs(current_dir_info[0][0], current_block[0]) < 0:
 
2311
                        # filesystem data refers to paths not covered by the dirblock.
 
2312
                        # this has two possibilities:
 
2313
                        # A) it is versioned but empty, so there is no block for it
 
2314
                        # B) it is not versioned.
 
2315
 
 
2316
                        # if (A) then we need to recurse into it to check for
 
2317
                        # new unknown files or directories.
 
2318
                        # if (B) then we should ignore it, because we don't
 
2319
                        # recurse into unknown directories.
 
2320
                        path_index = 0
 
2321
                        while path_index < len(current_dir_info[1]):
 
2322
                                current_path_info = current_dir_info[1][path_index]
 
2323
                                if want_unversioned:
 
2324
                                    if current_path_info[2] == 'directory':
 
2325
                                        if self.target._directory_is_tree_reference(
 
2326
                                            current_path_info[0].decode('utf8')):
 
2327
                                            current_path_info = current_path_info[:2] + \
 
2328
                                                ('tree-reference',) + current_path_info[3:]
 
2329
                                    new_executable = bool(
 
2330
                                        stat.S_ISREG(current_path_info[3].st_mode)
 
2331
                                        and stat.S_IEXEC & current_path_info[3].st_mode)
 
2332
                                    yield (None,
 
2333
                                        (None, utf8_decode(current_path_info[0])[0]),
 
2334
                                        True,
 
2335
                                        (False, False),
 
2336
                                        (None, None),
 
2337
                                        (None, utf8_decode(current_path_info[1])[0]),
 
2338
                                        (None, current_path_info[2]),
 
2339
                                        (None, new_executable))
 
2340
                                # dont descend into this unversioned path if it is
 
2341
                                # a dir
 
2342
                                if current_path_info[2] in ('directory',
 
2343
                                                            'tree-reference'):
 
2344
                                    del current_dir_info[1][path_index]
 
2345
                                    path_index -= 1
 
2346
                                path_index += 1
 
2347
 
 
2348
                        # This dir info has been handled, go to the next
 
2349
                        try:
 
2350
                            current_dir_info = dir_iterator.next()
 
2351
                        except StopIteration:
 
2352
                            current_dir_info = None
 
2353
                    else:
 
2354
                        # We have a dirblock entry for this location, but there
 
2355
                        # is no filesystem path for this. This is most likely
 
2356
                        # because a directory was removed from the disk.
 
2357
                        # We don't have to report the missing directory,
 
2358
                        # because that should have already been handled, but we
 
2359
                        # need to handle all of the files that are contained
 
2360
                        # within.
 
2361
                        for current_entry in current_block[1]:
 
2362
                            # entry referring to file not present on disk.
 
2363
                            # advance the entry only, after processing.
 
2364
                            result = _process_entry(current_entry, None)
 
2365
                            if result is not None:
 
2366
                                if result is not uninteresting:
 
2367
                                    yield result
 
2368
                        block_index +=1
 
2369
                        if (block_index < len(state._dirblocks) and
 
2370
                            osutils.is_inside(current_root,
 
2371
                                              state._dirblocks[block_index][0])):
 
2372
                            current_block = state._dirblocks[block_index]
 
2373
                        else:
 
2374
                            current_block = None
 
2375
                    continue
 
2376
                entry_index = 0
 
2377
                if current_block and entry_index < len(current_block[1]):
 
2378
                    current_entry = current_block[1][entry_index]
 
2379
                else:
 
2380
                    current_entry = None
 
2381
                advance_entry = True
 
2382
                path_index = 0
 
2383
                if current_dir_info and path_index < len(current_dir_info[1]):
 
2384
                    current_path_info = current_dir_info[1][path_index]
 
2385
                    if current_path_info[2] == 'directory':
 
2386
                        if self.target._directory_is_tree_reference(
 
2387
                            current_path_info[0].decode('utf8')):
 
2388
                            current_path_info = current_path_info[:2] + \
 
2389
                                ('tree-reference',) + current_path_info[3:]
 
2390
                else:
 
2391
                    current_path_info = None
 
2392
                advance_path = True
 
2393
                path_handled = False
 
2394
                while (current_entry is not None or
 
2395
                    current_path_info is not None):
 
2396
                    if current_entry is None:
 
2397
                        # the check for path_handled when the path is advanced
 
2398
                        # will yield this path if needed.
 
2399
                        pass
 
2400
                    elif current_path_info is None:
 
2401
                        # no path is fine: the per entry code will handle it.
 
2402
                        result = _process_entry(current_entry, current_path_info)
 
2403
                        if result is not None:
 
2404
                            if result is not uninteresting:
 
2405
                                yield result
 
2406
                    elif (current_entry[0][1] != current_path_info[1]
 
2407
                          or current_entry[1][target_index][0] in 'ar'):
 
2408
                        # The current path on disk doesn't match the dirblock
 
2409
                        # record. Either the dirblock is marked as absent, or
 
2410
                        # the file on disk is not present at all in the
 
2411
                        # dirblock. Either way, report about the dirblock
 
2412
                        # entry, and let other code handle the filesystem one.
 
2413
 
 
2414
                        # Compare the basename for these files to determine
 
2415
                        # which comes first
 
2416
                        if current_path_info[1] < current_entry[0][1]:
 
2417
                            # extra file on disk: pass for now, but only
 
2418
                            # increment the path, not the entry
 
2419
                            advance_entry = False
 
2420
                        else:
 
2421
                            # entry referring to file not present on disk.
 
2422
                            # advance the entry only, after processing.
 
2423
                            result = _process_entry(current_entry, None)
 
2424
                            if result is not None:
 
2425
                                if result is not uninteresting:
 
2426
                                    yield result
 
2427
                            advance_path = False
 
2428
                    else:
 
2429
                        result = _process_entry(current_entry, current_path_info)
 
2430
                        if result is not None:
 
2431
                            path_handled = True
 
2432
                            if result is not uninteresting:
 
2433
                                yield result
 
2434
                    if advance_entry and current_entry is not None:
 
2435
                        entry_index += 1
 
2436
                        if entry_index < len(current_block[1]):
 
2437
                            current_entry = current_block[1][entry_index]
 
2438
                        else:
 
2439
                            current_entry = None
 
2440
                    else:
 
2441
                        advance_entry = True # reset the advance flaga
 
2442
                    if advance_path and current_path_info is not None:
 
2443
                        if not path_handled:
 
2444
                            # unversioned in all regards
 
2445
                            if want_unversioned:
 
2446
                                new_executable = bool(
 
2447
                                    stat.S_ISREG(current_path_info[3].st_mode)
 
2448
                                    and stat.S_IEXEC & current_path_info[3].st_mode)
 
2449
                                yield (None,
 
2450
                                    (None, utf8_decode(current_path_info[0])[0]),
 
2451
                                    True,
 
2452
                                    (False, False),
 
2453
                                    (None, None),
 
2454
                                    (None, utf8_decode(current_path_info[1])[0]),
 
2455
                                    (None, current_path_info[2]),
 
2456
                                    (None, new_executable))
 
2457
                            # dont descend into this unversioned path if it is
 
2458
                            # a dir
 
2459
                            if current_path_info[2] in ('directory'):
 
2460
                                del current_dir_info[1][path_index]
 
2461
                                path_index -= 1
 
2462
                        # dont descend the disk iterator into any tree 
 
2463
                        # paths.
 
2464
                        if current_path_info[2] == 'tree-reference':
 
2465
                            del current_dir_info[1][path_index]
 
2466
                            path_index -= 1
 
2467
                        path_index += 1
 
2468
                        if path_index < len(current_dir_info[1]):
 
2469
                            current_path_info = current_dir_info[1][path_index]
 
2470
                            if current_path_info[2] == 'directory':
 
2471
                                if self.target._directory_is_tree_reference(
 
2472
                                    current_path_info[0].decode('utf8')):
 
2473
                                    current_path_info = current_path_info[:2] + \
 
2474
                                        ('tree-reference',) + current_path_info[3:]
 
2475
                        else:
 
2476
                            current_path_info = None
 
2477
                        path_handled = False
 
2478
                    else:
 
2479
                        advance_path = True # reset the advance flagg.
 
2480
                if current_block is not None:
 
2481
                    block_index += 1
 
2482
                    if (block_index < len(state._dirblocks) and
 
2483
                        osutils.is_inside(current_root, state._dirblocks[block_index][0])):
 
2484
                        current_block = state._dirblocks[block_index]
 
2485
                    else:
 
2486
                        current_block = None
 
2487
                if current_dir_info is not None:
 
2488
                    try:
 
2489
                        current_dir_info = dir_iterator.next()
 
2490
                    except StopIteration:
 
2491
                        current_dir_info = None
 
2492
 
2116
2493
 
2117
2494
    @staticmethod
2118
2495
    def is_compatible(source, target):
2119
2496
        # the target must be a dirstate working tree
2120
 
        if not isinstance(target, DirStateWorkingTree):
 
2497
        if not isinstance(target, WorkingTree4):
2121
2498
            return False
2122
 
        # the source must be a revtree or dirstate rev tree.
 
2499
        # the source must be a revtree or dirstate rev tree.
2123
2500
        if not isinstance(source,
2124
2501
            (revisiontree.RevisionTree, DirStateRevisionTree)):
2125
2502
            return False
2126
2503
        # the source revid must be in the target dirstate
2127
 
        if not (source._revision_id == _mod_revision.NULL_REVISION or
 
2504
        if not (source._revision_id == NULL_REVISION or
2128
2505
            source._revision_id in target.get_parent_ids()):
2129
 
            # TODO: what about ghosts? it may well need to
 
2506
            # TODO: what about ghosts? it may well need to 
2130
2507
            # check for them explicitly.
2131
2508
            return False
2132
2509
        return True
2142
2519
 
2143
2520
    def convert(self, tree):
2144
2521
        # lock the control files not the tree, so that we dont get tree
2145
 
        # on-unlock behaviours, and so that noone else diddles with the
 
2522
        # on-unlock behaviours, and so that noone else diddles with the 
2146
2523
        # tree during upgrade.
2147
2524
        tree._control_files.lock_write()
2148
2525
        try:
2177
2554
        tree._transport.put_bytes('format',
2178
2555
            self.target_format.get_format_string(),
2179
2556
            mode=tree.bzrdir._get_file_mode())
2180
 
 
2181
 
 
2182
 
class Converter4to5(object):
    """Perform an in-place upgrade of format 4 to format 5 trees."""

    def __init__(self):
        # The format whose format string update_format() writes out.
        self.target_format = WorkingTreeFormat5()

    def convert(self, tree):
        """Upgrade ``tree`` in place.

        The tree's control files are write-locked for the duration of the
        upgrade and are always unlocked again, even if the upgrade raises.

        :param tree: The working tree to upgrade.
        """
        # lock the control files not the tree, so that we don't get tree
        # on-unlock behaviours, and so that no-one else diddles with the
        # tree during upgrade.
        tree._control_files.lock_write()
        try:
            self.update_format(tree)
        finally:
            tree._control_files.unlock()

    def update_format(self, tree):
        """Change the format marker.

        Writes the target format's format string to the 'format' entry of
        the tree's transport, using the file mode reported by the tree's
        bzrdir.

        :param tree: The working tree whose format marker is rewritten.
        """
        tree._transport.put_bytes('format',
            self.target_format.get_format_string(),
            mode=tree.bzrdir._get_file_mode())
2203
 
 
2204
 
 
2205
 
class Converter4or5to6(object):
    """Perform an in-place upgrade of format 4 or 5 to format 6 trees."""

    def __init__(self):
        # The format whose format string update_format() writes out.
        self.target_format = WorkingTreeFormat6()

    def convert(self, tree):
        """Upgrade ``tree`` in place.

        The custom control files are created first and the format marker is
        rewritten afterwards. The tree's control files are write-locked for
        the duration and are always unlocked again, even if a step raises.

        :param tree: The working tree to upgrade.
        """
        # lock the control files not the tree, so that we don't get tree
        # on-unlock behaviours, and so that no-one else diddles with the
        # tree during upgrade.
        tree._control_files.lock_write()
        try:
            self.init_custom_control_files(tree)
            self.update_format(tree)
        finally:
            tree._control_files.unlock()

    def init_custom_control_files(self, tree):
        """Initialize custom control files.

        Writes an empty 'views' entry to the tree's transport, using the
        file mode reported by the tree's bzrdir.

        :param tree: The working tree being upgraded.
        """
        tree._transport.put_bytes('views', '',
            mode=tree.bzrdir._get_file_mode())

    def update_format(self, tree):
        """Change the format marker.

        Writes the target format's format string to the 'format' entry of
        the tree's transport, using the file mode reported by the tree's
        bzrdir.

        :param tree: The working tree whose format marker is rewritten.
        """
        tree._transport.put_bytes('format',
            self.target_format.get_format_string(),
            mode=tree.bzrdir._get_file_mode())