~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transform.py

  • Committer: Canonical.com Patch Queue Manager
  • Date: 2009-02-18 13:27:08 UTC
  • mfrom: (4011.4.3 ssh-hints)
  • Revision ID: pqm@pqm.ubuntu.com-20090218132708-okubrahz9exvae9r
(Jelmer) Point out bzr+ssh:// to the user when they use ssh://.

Show diffs side-by-side

added added

removed removed

Lines of Context:
 
1
# Copyright (C) 2006, 2007, 2008 Canonical Ltd
 
2
#
 
3
# This program is free software; you can redistribute it and/or modify
 
4
# it under the terms of the GNU General Public License as published by
 
5
# the Free Software Foundation; either version 2 of the License, or
 
6
# (at your option) any later version.
 
7
#
 
8
# This program is distributed in the hope that it will be useful,
 
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
 
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 
11
# GNU General Public License for more details.
 
12
#
 
13
# You should have received a copy of the GNU General Public License
 
14
# along with this program; if not, write to the Free Software
 
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 
16
 
 
17
import os
 
18
import errno
 
19
from stat import S_ISREG, S_IEXEC
 
20
 
 
21
from bzrlib.lazy_import import lazy_import
 
22
lazy_import(globals(), """
 
23
from bzrlib import (
 
24
    annotate,
 
25
    bzrdir,
 
26
    delta,
 
27
    errors,
 
28
    inventory,
 
29
    multiparent,
 
30
    osutils,
 
31
    revision as _mod_revision,
 
32
    )
 
33
from bzrlib.util import bencode
 
34
""")
 
35
from bzrlib.errors import (DuplicateKey, MalformedTransform, NoSuchFile,
 
36
                           ReusingTransform, NotVersionedError, CantMoveRoot,
 
37
                           ExistingLimbo, ImmortalLimbo, NoFinalPath,
 
38
                           UnableCreateSymlink)
 
39
from bzrlib.inventory import InventoryEntry
 
40
from bzrlib.osutils import (
 
41
    delete_any,
 
42
    file_kind,
 
43
    has_symlinks,
 
44
    lexists,
 
45
    pathjoin,
 
46
    sha_file,
 
47
    splitpath,
 
48
    supports_executable,
 
49
)
 
50
from bzrlib.progress import DummyProgress, ProgressPhase
 
51
from bzrlib.symbol_versioning import (
 
52
        deprecated_function,
 
53
        deprecated_in,
 
54
        )
 
55
from bzrlib.trace import mutter, warning
 
56
from bzrlib import tree
 
57
import bzrlib.ui
 
58
import bzrlib.urlutils as urlutils
 
59
 
 
60
 
 
61
ROOT_PARENT = "root-parent"
 
62
 
 
63
 
 
64
def unique_add(map, key, value):
    """Store value under key in map, refusing to overwrite.

    Raises DuplicateKey if key is already present; map is left untouched in
    that case.
    """
    if key not in map:
        map[key] = value
        return
    raise DuplicateKey(key=key)
 
68
 
 
69
 
 
70
class _TransformResults(object):
 
71
    def __init__(self, modified_paths, rename_count):
 
72
        object.__init__(self)
 
73
        self.modified_paths = modified_paths
 
74
        self.rename_count = rename_count
 
75
 
 
76
 
 
77
class TreeTransformBase(object):
 
78
    """The base class for TreeTransform and TreeTransformBase"""
 
79
 
 
80
    def __init__(self, tree, limbodir, pb=DummyProgress(),
                 case_sensitive=True):
        """Constructor.

        :param tree: The tree that will be transformed, but not necessarily
            the output tree.
        :param limbodir: A directory where new files can be stored until
            they are installed in their proper places
        :param pb: A ProgressBar indicating how much progress is being made
        :param case_sensitive: If True, the target of the transform is
            case sensitive, not just case preserving.
        """
        object.__init__(self)
        self._tree = tree
        self._limbodir = limbodir
        self._deletiondir = None
        # Counter used by _assign_id to build "new-N" transform ids
        self._id_number = 0
        # mapping of trans_id -> new basename
        self._new_name = {}
        # mapping of trans_id -> new parent trans_id
        self._new_parent = {}
        # mapping of trans_id with new contents -> new file_kind
        self._new_contents = {}
        # A mapping of transform ids to their limbo filename
        self._limbo_files = {}
        # A mapping of transform ids to a set of the transform ids of children
        # that their limbo directory has
        self._limbo_children = {}
        # Map transform ids to maps of child filename to child transform id
        self._limbo_children_names = {}
        # List of transform ids that need to be renamed from limbo into place
        self._needs_rename = set()
        # Set of trans_ids whose contents will be removed
        self._removed_contents = set()
        # Mapping of trans_id -> new execute-bit value
        self._new_executability = {}
        # Mapping of trans_id -> new tree-reference value
        self._new_reference_revision = {}
        # Mapping of trans_id -> new file_id
        self._new_id = {}
        # Mapping of old file-id -> trans_id
        self._non_present_ids = {}
        # Mapping of new file_id -> trans_id
        self._r_new_id = {}
        # Set of trans_ids that will be removed
        self._removed_id = set()
        # Mapping of path in old tree -> trans_id
        self._tree_path_ids = {}
        # Mapping trans_id -> path in old tree
        self._tree_id_paths = {}
        # Cache of realpath results, to speed up canonical_path
        self._realpaths = {}
        # Cache of relpath results, to speed up canonical_path
        self._relpaths = {}
        # The trans_id that will be used as the tree root
        # (trans_id_tree_file_id reads and fills the path/id maps and caches
        # created above, so this lookup has to come after them.)
        root_id = tree.get_root_id()
        if root_id is not None:
            self._new_root = self.trans_id_tree_file_id(root_id)
        else:
            self._new_root = None
        # Indicator of whether the transform has been applied
        self._done = False
        # A progress bar
        self._pb = pb
        # Whether the target is case sensitive
        self._case_sensitive_target = case_sensitive
        # A counter of how many files have been renamed
        self.rename_count = 0
 
148
 
 
149
    def __get_root(self):
        """Return the trans_id currently used as the tree root (may be None)."""
        return self._new_root

    # Read-only view of _new_root; no setter is defined here.
    root = property(__get_root)
 
153
 
 
154
    def finalize(self):
 
155
        """Release the working tree lock, if held, clean up limbo dir.
 
156
 
 
157
        This is required if apply has not been invoked, but can be invoked
 
158
        even after apply.
 
159
        """
 
160
        if self._tree is None:
 
161
            return
 
162
        try:
 
163
            entries = [(self._limbo_name(t), t, k) for t, k in
 
164
                       self._new_contents.iteritems()]
 
165
            entries.sort(reverse=True)
 
166
            for path, trans_id, kind in entries:
 
167
                if kind == "directory":
 
168
                    os.rmdir(path)
 
169
                else:
 
170
                    os.unlink(path)
 
171
            try:
 
172
                os.rmdir(self._limbodir)
 
173
            except OSError:
 
174
                # We don't especially care *why* the dir is immortal.
 
175
                raise ImmortalLimbo(self._limbodir)
 
176
            try:
 
177
                if self._deletiondir is not None:
 
178
                    os.rmdir(self._deletiondir)
 
179
            except OSError:
 
180
                raise errors.ImmortalPendingDeletion(self._deletiondir)
 
181
        finally:
 
182
            self._tree.unlock()
 
183
            self._tree = None
 
184
 
 
185
    def _assign_id(self):
 
186
        """Produce a new tranform id"""
 
187
        new_id = "new-%s" % self._id_number
 
188
        self._id_number +=1
 
189
        return new_id
 
190
 
 
191
    def create_path(self, name, parent):
 
192
        """Assign a transaction id to a new path"""
 
193
        trans_id = self._assign_id()
 
194
        unique_add(self._new_name, trans_id, name)
 
195
        unique_add(self._new_parent, trans_id, parent)
 
196
        return trans_id
 
197
 
 
198
    def adjust_path(self, name, parent, trans_id):
 
199
        """Change the path that is assigned to a transaction id."""
 
200
        if trans_id == self._new_root:
 
201
            raise CantMoveRoot
 
202
        previous_parent = self._new_parent.get(trans_id)
 
203
        previous_name = self._new_name.get(trans_id)
 
204
        self._new_name[trans_id] = name
 
205
        self._new_parent[trans_id] = parent
 
206
        if parent == ROOT_PARENT:
 
207
            if self._new_root is not None:
 
208
                raise ValueError("Cannot have multiple roots.")
 
209
            self._new_root = trans_id
 
210
        if (trans_id in self._limbo_files and
 
211
            trans_id not in self._needs_rename):
 
212
            self._rename_in_limbo([trans_id])
 
213
            self._limbo_children[previous_parent].remove(trans_id)
 
214
            del self._limbo_children_names[previous_parent][previous_name]
 
215
 
 
216
    def _rename_in_limbo(self, trans_ids):
 
217
        """Fix limbo names so that the right final path is produced.
 
218
 
 
219
        This means we outsmarted ourselves-- we tried to avoid renaming
 
220
        these files later by creating them with their final names in their
 
221
        final parents.  But now the previous name or parent is no longer
 
222
        suitable, so we have to rename them.
 
223
 
 
224
        Even for trans_ids that have no new contents, we must remove their
 
225
        entries from _limbo_files, because they are now stale.
 
226
        """
 
227
        for trans_id in trans_ids:
 
228
            old_path = self._limbo_files.pop(trans_id)
 
229
            if trans_id not in self._new_contents:
 
230
                continue
 
231
            new_path = self._limbo_name(trans_id)
 
232
            os.rename(old_path, new_path)
 
233
 
 
234
    def adjust_root_path(self, name, parent):
 
235
        """Emulate moving the root by moving all children, instead.
 
236
        
 
237
        We do this by undoing the association of root's transaction id with the
 
238
        current tree.  This allows us to create a new directory with that
 
239
        transaction id.  We unversion the root directory and version the 
 
240
        physically new directory, and hope someone versions the tree root
 
241
        later.
 
242
        """
 
243
        old_root = self._new_root
 
244
        old_root_file_id = self.final_file_id(old_root)
 
245
        # force moving all children of root
 
246
        for child_id in self.iter_tree_children(old_root):
 
247
            if child_id != parent:
 
248
                self.adjust_path(self.final_name(child_id), 
 
249
                                 self.final_parent(child_id), child_id)
 
250
            file_id = self.final_file_id(child_id)
 
251
            if file_id is not None:
 
252
                self.unversion_file(child_id)
 
253
            self.version_file(file_id, child_id)
 
254
        
 
255
        # the physical root needs a new transaction id
 
256
        self._tree_path_ids.pop("")
 
257
        self._tree_id_paths.pop(old_root)
 
258
        self._new_root = self.trans_id_tree_file_id(self._tree.get_root_id())
 
259
        if parent == old_root:
 
260
            parent = self._new_root
 
261
        self.adjust_path(name, parent, old_root)
 
262
        self.create_directory(old_root)
 
263
        self.version_file(old_root_file_id, old_root)
 
264
        self.unversion_file(self._new_root)
 
265
 
 
266
    def trans_id_tree_file_id(self, inventory_id):
 
267
        """Determine the transaction id of a working tree file.
 
268
        
 
269
        This reflects only files that already exist, not ones that will be
 
270
        added by transactions.
 
271
        """
 
272
        if inventory_id is None:
 
273
            raise ValueError('None is not a valid file id')
 
274
        path = self._tree.id2path(inventory_id)
 
275
        return self.trans_id_tree_path(path)
 
276
 
 
277
    def trans_id_file_id(self, file_id):
 
278
        """Determine or set the transaction id associated with a file ID.
 
279
        A new id is only created for file_ids that were never present.  If
 
280
        a transaction has been unversioned, it is deliberately still returned.
 
281
        (this will likely lead to an unversioned parent conflict.)
 
282
        """
 
283
        if file_id is None:
 
284
            raise ValueError('None is not a valid file id')
 
285
        if file_id in self._r_new_id and self._r_new_id[file_id] is not None:
 
286
            return self._r_new_id[file_id]
 
287
        else:
 
288
            try:
 
289
                self._tree.iter_entries_by_dir([file_id]).next()
 
290
            except StopIteration:
 
291
                if file_id in self._non_present_ids:
 
292
                    return self._non_present_ids[file_id]
 
293
                else:
 
294
                    trans_id = self._assign_id()
 
295
                    self._non_present_ids[file_id] = trans_id
 
296
                    return trans_id
 
297
            else:
 
298
                return self.trans_id_tree_file_id(file_id)
 
299
 
 
300
    def canonical_path(self, path):
 
301
        """Get the canonical tree-relative path"""
 
302
        # don't follow final symlinks
 
303
        abs = self._tree.abspath(path)
 
304
        if abs in self._relpaths:
 
305
            return self._relpaths[abs]
 
306
        dirname, basename = os.path.split(abs)
 
307
        if dirname not in self._realpaths:
 
308
            self._realpaths[dirname] = os.path.realpath(dirname)
 
309
        dirname = self._realpaths[dirname]
 
310
        abs = pathjoin(dirname, basename)
 
311
        if dirname in self._relpaths:
 
312
            relpath = pathjoin(self._relpaths[dirname], basename)
 
313
            relpath = relpath.rstrip('/\\')
 
314
        else:
 
315
            relpath = self._tree.relpath(abs)
 
316
        self._relpaths[abs] = relpath
 
317
        return relpath
 
318
 
 
319
    def trans_id_tree_path(self, path):
 
320
        """Determine (and maybe set) the transaction ID for a tree path."""
 
321
        path = self.canonical_path(path)
 
322
        if path not in self._tree_path_ids:
 
323
            self._tree_path_ids[path] = self._assign_id()
 
324
            self._tree_id_paths[self._tree_path_ids[path]] = path
 
325
        return self._tree_path_ids[path]
 
326
 
 
327
    def get_tree_parent(self, trans_id):
 
328
        """Determine id of the parent in the tree."""
 
329
        path = self._tree_id_paths[trans_id]
 
330
        if path == "":
 
331
            return ROOT_PARENT
 
332
        return self.trans_id_tree_path(os.path.dirname(path))
 
333
 
 
334
    def create_file(self, contents, trans_id, mode_id=None):
 
335
        """Schedule creation of a new file.
 
336
 
 
337
        See also new_file.
 
338
        
 
339
        Contents is an iterator of strings, all of which will be written
 
340
        to the target destination.
 
341
 
 
342
        New file takes the permissions of any existing file with that id,
 
343
        unless mode_id is specified.
 
344
        """
 
345
        name = self._limbo_name(trans_id)
 
346
        f = open(name, 'wb')
 
347
        try:
 
348
            try:
 
349
                unique_add(self._new_contents, trans_id, 'file')
 
350
            except:
 
351
                # Clean up the file, it never got registered so
 
352
                # TreeTransform.finalize() won't clean it up.
 
353
                f.close()
 
354
                os.unlink(name)
 
355
                raise
 
356
 
 
357
            f.writelines(contents)
 
358
        finally:
 
359
            f.close()
 
360
        self._set_mode(trans_id, mode_id, S_ISREG)
 
361
 
 
362
    def _set_mode(self, trans_id, mode_id, typefunc):
 
363
        """Set the mode of new file contents.
 
364
        The mode_id is the existing file to get the mode from (often the same
 
365
        as trans_id).  The operation is only performed if there's a mode match
 
366
        according to typefunc.
 
367
        """
 
368
        if mode_id is None:
 
369
            mode_id = trans_id
 
370
        try:
 
371
            old_path = self._tree_id_paths[mode_id]
 
372
        except KeyError:
 
373
            return
 
374
        try:
 
375
            mode = os.stat(self._tree.abspath(old_path)).st_mode
 
376
        except OSError, e:
 
377
            if e.errno in (errno.ENOENT, errno.ENOTDIR):
 
378
                # Either old_path doesn't exist, or the parent of the
 
379
                # target is not a directory (but will be one eventually)
 
380
                # Either way, we know it doesn't exist *right now*
 
381
                # See also bug #248448
 
382
                return
 
383
            else:
 
384
                raise
 
385
        if typefunc(mode):
 
386
            os.chmod(self._limbo_name(trans_id), mode)
 
387
 
 
388
    def create_hardlink(self, path, trans_id):
 
389
        """Schedule creation of a hard link"""
 
390
        name = self._limbo_name(trans_id)
 
391
        try:
 
392
            os.link(path, name)
 
393
        except OSError, e:
 
394
            if e.errno != errno.EPERM:
 
395
                raise
 
396
            raise errors.HardLinkNotSupported(path)
 
397
        try:
 
398
            unique_add(self._new_contents, trans_id, 'file')
 
399
        except:
 
400
            # Clean up the file, it never got registered so
 
401
            # TreeTransform.finalize() won't clean it up.
 
402
            os.unlink(name)
 
403
            raise
 
404
 
 
405
    def create_directory(self, trans_id):
 
406
        """Schedule creation of a new directory.
 
407
        
 
408
        See also new_directory.
 
409
        """
 
410
        os.mkdir(self._limbo_name(trans_id))
 
411
        unique_add(self._new_contents, trans_id, 'directory')
 
412
 
 
413
    def create_symlink(self, target, trans_id):
 
414
        """Schedule creation of a new symbolic link.
 
415
 
 
416
        target is a bytestring.
 
417
        See also new_symlink.
 
418
        """
 
419
        if has_symlinks():
 
420
            os.symlink(target, self._limbo_name(trans_id))
 
421
            unique_add(self._new_contents, trans_id, 'symlink')
 
422
        else:
 
423
            try:
 
424
                path = FinalPaths(self).get_path(trans_id)
 
425
            except KeyError:
 
426
                path = None
 
427
            raise UnableCreateSymlink(path=path)
 
428
 
 
429
    def cancel_creation(self, trans_id):
        """Cancel the creation of new file contents.

        Raises KeyError if trans_id has no new contents scheduled.
        """
        del self._new_contents[trans_id]
        children = self._limbo_children.get(trans_id)
        # if this is a limbo directory with children, move them before removing
        # the directory
        if children is not None:
            self._rename_in_limbo(children)
            del self._limbo_children[trans_id]
            del self._limbo_children_names[trans_id]
        # Finally remove the limbo entry itself.
        delete_any(self._limbo_name(trans_id))
 
440
 
 
441
    def delete_contents(self, trans_id):
        """Schedule the contents of a path entry for deletion"""
        # Called only for its check: tree_kind raises NoSuchFile when the
        # entry has no tree path or the path does not exist.
        self.tree_kind(trans_id)
        self._removed_contents.add(trans_id)
 
445
 
 
446
    def cancel_deletion(self, trans_id):
        """Cancel a scheduled deletion

        Raises KeyError if no deletion was scheduled for trans_id.
        """
        self._removed_contents.remove(trans_id)
 
449
 
 
450
    def unversion_file(self, trans_id):
        """Schedule a path entry to become unversioned"""
        # Only records the id in a set, so repeating the call has no effect.
        self._removed_id.add(trans_id)
 
453
 
 
454
    def delete_versioned(self, trans_id):
        """Delete and unversion a versioned file"""
        # delete_contents runs first and raises NoSuchFile for an entry with
        # no existing tree file, in which case nothing is unversioned.
        self.delete_contents(trans_id)
        self.unversion_file(trans_id)
 
458
 
 
459
    def set_executability(self, executability, trans_id):
 
460
        """Schedule setting of the 'execute' bit
 
461
        To unschedule, set to None
 
462
        """
 
463
        if executability is None:
 
464
            del self._new_executability[trans_id]
 
465
        else:
 
466
            unique_add(self._new_executability, trans_id, executability)
 
467
 
 
468
    def set_tree_reference(self, revision_id, trans_id):
        """Set the reference associated with a directory"""
        # unique_add rejects a second reference for the same trans_id.
        unique_add(self._new_reference_revision, trans_id, revision_id)
 
471
 
 
472
    def version_file(self, file_id, trans_id):
 
473
        """Schedule a file to become versioned."""
 
474
        if file_id is None:
 
475
            raise ValueError()
 
476
        unique_add(self._new_id, trans_id, file_id)
 
477
        unique_add(self._r_new_id, file_id, trans_id)
 
478
 
 
479
    def cancel_versioning(self, trans_id):
 
480
        """Undo a previous versioning of a file"""
 
481
        file_id = self._new_id[trans_id]
 
482
        del self._new_id[trans_id]
 
483
        del self._r_new_id[file_id]
 
484
 
 
485
    def new_paths(self, filesystem_only=False):
 
486
        """Determine the paths of all new and changed files.
 
487
 
 
488
        :param filesystem_only: if True, only calculate values for files
 
489
            that require renames or execute bit changes.
 
490
        """
 
491
        new_ids = set()
 
492
        if filesystem_only:
 
493
            stale_ids = self._needs_rename.difference(self._new_name)
 
494
            stale_ids.difference_update(self._new_parent)
 
495
            stale_ids.difference_update(self._new_contents)
 
496
            stale_ids.difference_update(self._new_id)
 
497
            needs_rename = self._needs_rename.difference(stale_ids)
 
498
            id_sets = (needs_rename, self._new_executability)
 
499
        else:
 
500
            id_sets = (self._new_name, self._new_parent, self._new_contents,
 
501
                       self._new_id, self._new_executability)
 
502
        for id_set in id_sets:
 
503
            new_ids.update(id_set)
 
504
        return sorted(FinalPaths(self).get_paths(new_ids))
 
505
 
 
506
    def _inventory_altered(self):
 
507
        """Get the trans_ids and paths of files needing new inv entries."""
 
508
        new_ids = set()
 
509
        for id_set in [self._new_name, self._new_parent, self._new_id,
 
510
                       self._new_executability]:
 
511
            new_ids.update(id_set)
 
512
        changed_kind = set(self._removed_contents)
 
513
        changed_kind.intersection_update(self._new_contents)
 
514
        changed_kind.difference_update(new_ids)
 
515
        changed_kind = (t for t in changed_kind if self.tree_kind(t) !=
 
516
                        self.final_kind(t))
 
517
        new_ids.update(changed_kind)
 
518
        return sorted(FinalPaths(self).get_paths(new_ids))
 
519
 
 
520
    def tree_kind(self, trans_id):
 
521
        """Determine the file kind in the working tree.
 
522
 
 
523
        Raises NoSuchFile if the file does not exist
 
524
        """
 
525
        path = self._tree_id_paths.get(trans_id)
 
526
        if path is None:
 
527
            raise NoSuchFile(None)
 
528
        try:
 
529
            return file_kind(self._tree.abspath(path))
 
530
        except OSError, e:
 
531
            if e.errno != errno.ENOENT:
 
532
                raise
 
533
            else:
 
534
                raise NoSuchFile(path)
 
535
 
 
536
    def final_kind(self, trans_id):
 
537
        """Determine the final file kind, after any changes applied.
 
538
        
 
539
        Raises NoSuchFile if the file does not exist/has no contents.
 
540
        (It is conceivable that a path would be created without the
 
541
        corresponding contents insertion command)
 
542
        """
 
543
        if trans_id in self._new_contents:
 
544
            return self._new_contents[trans_id]
 
545
        elif trans_id in self._removed_contents:
 
546
            raise NoSuchFile(None)
 
547
        else:
 
548
            return self.tree_kind(trans_id)
 
549
 
 
550
    def tree_file_id(self, trans_id):
 
551
        """Determine the file id associated with the trans_id in the tree"""
 
552
        try:
 
553
            path = self._tree_id_paths[trans_id]
 
554
        except KeyError:
 
555
            # the file is a new, unversioned file, or invalid trans_id
 
556
            return None
 
557
        # the file is old; the old id is still valid
 
558
        if self._new_root == trans_id:
 
559
            return self._tree.get_root_id()
 
560
        return self._tree.path2id(path)
 
561
 
 
562
    def final_file_id(self, trans_id):
 
563
        """Determine the file id after any changes are applied, or None.
 
564
        
 
565
        None indicates that the file will not be versioned after changes are
 
566
        applied.
 
567
        """
 
568
        try:
 
569
            return self._new_id[trans_id]
 
570
        except KeyError:
 
571
            if trans_id in self._removed_id:
 
572
                return None
 
573
        return self.tree_file_id(trans_id)
 
574
 
 
575
    def inactive_file_id(self, trans_id):
 
576
        """Return the inactive file_id associated with a transaction id.
 
577
        That is, the one in the tree or in non_present_ids.
 
578
        The file_id may actually be active, too.
 
579
        """
 
580
        file_id = self.tree_file_id(trans_id)
 
581
        if file_id is not None:
 
582
            return file_id
 
583
        for key, value in self._non_present_ids.iteritems():
 
584
            if value == trans_id:
 
585
                return key
 
586
 
 
587
    def final_parent(self, trans_id):
 
588
        """Determine the parent file_id, after any changes are applied.
 
589
 
 
590
        ROOT_PARENT is returned for the tree root.
 
591
        """
 
592
        try:
 
593
            return self._new_parent[trans_id]
 
594
        except KeyError:
 
595
            return self.get_tree_parent(trans_id)
 
596
 
 
597
    def final_name(self, trans_id):
 
598
        """Determine the final filename, after all changes are applied."""
 
599
        try:
 
600
            return self._new_name[trans_id]
 
601
        except KeyError:
 
602
            try:
 
603
                return os.path.basename(self._tree_id_paths[trans_id])
 
604
            except KeyError:
 
605
                raise NoFinalPath(trans_id, self)
 
606
 
 
607
    def by_parent(self):
 
608
        """Return a map of parent: children for known parents.
 
609
        
 
610
        Only new paths and parents of tree files with assigned ids are used.
 
611
        """
 
612
        by_parent = {}
 
613
        items = list(self._new_parent.iteritems())
 
614
        items.extend((t, self.final_parent(t)) for t in 
 
615
                      self._tree_id_paths.keys())
 
616
        for trans_id, parent_id in items:
 
617
            if parent_id not in by_parent:
 
618
                by_parent[parent_id] = set()
 
619
            by_parent[parent_id].add(trans_id)
 
620
        return by_parent
 
621
 
 
622
    def path_changed(self, trans_id):
 
623
        """Return True if a trans_id's path has changed."""
 
624
        return (trans_id in self._new_name) or (trans_id in self._new_parent)
 
625
 
 
626
    def new_contents(self, trans_id):
        """Return True if new contents have been scheduled for trans_id."""
        return (trans_id in self._new_contents)
 
628
 
 
629
    def find_conflicts(self):
        """Find any violations of inventory or filesystem invariants

        Returns a list holding the results of each individual check, in the
        order the checks are run below.  Raises ReusingTransform if the
        transform has already been applied.
        """
        if self._done is True:
            raise ReusingTransform()
        conflicts = []
        # ensure all children of all existent parents are known
        # all children of non-existent parents are known, by definition.
        self._add_tree_children()
        # Built once and shared by the checks that need parent -> children.
        by_parent = self.by_parent()
        conflicts.extend(self._unversioned_parents(by_parent))
        conflicts.extend(self._parent_loops())
        conflicts.extend(self._duplicate_entries(by_parent))
        conflicts.extend(self._duplicate_ids())
        conflicts.extend(self._parent_type_conflicts(by_parent))
        conflicts.extend(self._improper_versioning())
        conflicts.extend(self._executability_conflicts())
        conflicts.extend(self._overwrite_conflicts())
        return conflicts
 
647
 
 
648
    def _add_tree_children(self):
 
649
        """Add all the children of all active parents to the known paths.
 
650
 
 
651
        Active parents are those which gain children, and those which are
 
652
        removed.  This is a necessary first step in detecting conflicts.
 
653
        """
 
654
        parents = self.by_parent().keys()
 
655
        parents.extend([t for t in self._removed_contents if 
 
656
                        self.tree_kind(t) == 'directory'])
 
657
        for trans_id in self._removed_id:
 
658
            file_id = self.tree_file_id(trans_id)
 
659
            if file_id is not None:
 
660
                if self._tree.inventory[file_id].kind == 'directory':
 
661
                    parents.append(trans_id)
 
662
            elif self.tree_kind(trans_id) == 'directory':
 
663
                parents.append(trans_id)
 
664
 
 
665
        for parent_id in parents:
 
666
            # ensure that all children are registered with the transaction
 
667
            list(self.iter_tree_children(parent_id))
 
668
 
 
669
    def iter_tree_children(self, parent_id):
 
670
        """Iterate through the entry's tree children, if any"""
 
671
        try:
 
672
            path = self._tree_id_paths[parent_id]
 
673
        except KeyError:
 
674
            return
 
675
        try:
 
676
            children = os.listdir(self._tree.abspath(path))
 
677
        except OSError, e:
 
678
            if not (osutils._is_error_enotdir(e)
 
679
                    or e.errno in (errno.ENOENT, errno.ESRCH)):
 
680
                raise
 
681
            return
 
682
 
 
683
        for child in children:
 
684
            childpath = joinpath(path, child)
 
685
            if self._tree.is_control_filename(childpath):
 
686
                continue
 
687
            yield self.trans_id_tree_path(childpath)
 
688
 
 
689
    def has_named_child(self, by_parent, parent_id, name):
 
690
        try:
 
691
            children = by_parent[parent_id]
 
692
        except KeyError:
 
693
            children = []
 
694
        for child in children:
 
695
            if self.final_name(child) == name:
 
696
                return True
 
697
        try:
 
698
            path = self._tree_id_paths[parent_id]
 
699
        except KeyError:
 
700
            return False
 
701
        childpath = joinpath(path, name)
 
702
        child_id = self._tree_path_ids.get(childpath)
 
703
        if child_id is None:
 
704
            return lexists(self._tree.abspath(childpath))
 
705
        else:
 
706
            if self.final_parent(child_id) != parent_id:
 
707
                return False
 
708
            if child_id in self._removed_contents:
 
709
                # XXX What about dangling file-ids?
 
710
                return False
 
711
            else:
 
712
                return True
 
713
 
 
714
    def _parent_loops(self):
 
715
        """No entry should be its own ancestor"""
 
716
        conflicts = []
 
717
        for trans_id in self._new_parent:
 
718
            seen = set()
 
719
            parent_id = trans_id
 
720
            while parent_id is not ROOT_PARENT:
 
721
                seen.add(parent_id)
 
722
                try:
 
723
                    parent_id = self.final_parent(parent_id)
 
724
                except KeyError:
 
725
                    break
 
726
                if parent_id == trans_id:
 
727
                    conflicts.append(('parent loop', trans_id))
 
728
                if parent_id in seen:
 
729
                    break
 
730
        return conflicts
 
731
 
 
732
    def _unversioned_parents(self, by_parent):
 
733
        """If parent directories are versioned, children must be versioned."""
 
734
        conflicts = []
 
735
        for parent_id, children in by_parent.iteritems():
 
736
            if parent_id is ROOT_PARENT:
 
737
                continue
 
738
            if self.final_file_id(parent_id) is not None:
 
739
                continue
 
740
            for child_id in children:
 
741
                if self.final_file_id(child_id) is not None:
 
742
                    conflicts.append(('unversioned parent', parent_id))
 
743
                    break;
 
744
        return conflicts
 
745
 
 
746
    def _improper_versioning(self):
 
747
        """Cannot version a file with no contents, or a bad type.
 
748
        
 
749
        However, existing entries with no contents are okay.
 
750
        """
 
751
        conflicts = []
 
752
        for trans_id in self._new_id.iterkeys():
 
753
            try:
 
754
                kind = self.final_kind(trans_id)
 
755
            except NoSuchFile:
 
756
                conflicts.append(('versioning no contents', trans_id))
 
757
                continue
 
758
            if not InventoryEntry.versionable_kind(kind):
 
759
                conflicts.append(('versioning bad kind', trans_id, kind))
 
760
        return conflicts
 
761
 
 
762
    def _executability_conflicts(self):
 
763
        """Check for bad executability changes.
 
764
        
 
765
        Only versioned files may have their executability set, because
 
766
        1. only versioned entries can have executability under windows
 
767
        2. only files can be executable.  (The execute bit on a directory
 
768
           does not indicate searchability)
 
769
        """
 
770
        conflicts = []
 
771
        for trans_id in self._new_executability:
 
772
            if self.final_file_id(trans_id) is None:
 
773
                conflicts.append(('unversioned executability', trans_id))
 
774
            else:
 
775
                try:
 
776
                    non_file = self.final_kind(trans_id) != "file"
 
777
                except NoSuchFile:
 
778
                    non_file = True
 
779
                if non_file is True:
 
780
                    conflicts.append(('non-file executability', trans_id))
 
781
        return conflicts
 
782
 
 
783
    def _overwrite_conflicts(self):
 
784
        """Check for overwrites (not permitted on Win32)"""
 
785
        conflicts = []
 
786
        for trans_id in self._new_contents:
 
787
            try:
 
788
                self.tree_kind(trans_id)
 
789
            except NoSuchFile:
 
790
                continue
 
791
            if trans_id not in self._removed_contents:
 
792
                conflicts.append(('overwrite', trans_id,
 
793
                                 self.final_name(trans_id)))
 
794
        return conflicts
 
795
 
 
796
    def _duplicate_entries(self, by_parent):
 
797
        """No directory may have two entries with the same name."""
 
798
        conflicts = []
 
799
        if (self._new_name, self._new_parent) == ({}, {}):
 
800
            return conflicts
 
801
        for children in by_parent.itervalues():
 
802
            name_ids = [(self.final_name(t), t) for t in children]
 
803
            if not self._case_sensitive_target:
 
804
                name_ids = [(n.lower(), t) for n, t in name_ids]
 
805
            name_ids.sort()
 
806
            last_name = None
 
807
            last_trans_id = None
 
808
            for name, trans_id in name_ids:
 
809
                try:
 
810
                    kind = self.final_kind(trans_id)
 
811
                except NoSuchFile:
 
812
                    kind = None
 
813
                file_id = self.final_file_id(trans_id)
 
814
                if kind is None and file_id is None:
 
815
                    continue
 
816
                if name == last_name:
 
817
                    conflicts.append(('duplicate', last_trans_id, trans_id,
 
818
                    name))
 
819
                last_name = name
 
820
                last_trans_id = trans_id
 
821
        return conflicts
 
822
 
 
823
    def _duplicate_ids(self):
 
824
        """Each inventory id may only be used once"""
 
825
        conflicts = []
 
826
        removed_tree_ids = set((self.tree_file_id(trans_id) for trans_id in
 
827
                                self._removed_id))
 
828
        all_ids = self._tree.all_file_ids()
 
829
        active_tree_ids = all_ids.difference(removed_tree_ids)
 
830
        for trans_id, file_id in self._new_id.iteritems():
 
831
            if file_id in active_tree_ids:
 
832
                old_trans_id = self.trans_id_tree_file_id(file_id)
 
833
                conflicts.append(('duplicate id', old_trans_id, trans_id))
 
834
        return conflicts
 
835
 
 
836
    def _parent_type_conflicts(self, by_parent):
 
837
        """parents must have directory 'contents'."""
 
838
        conflicts = []
 
839
        for parent_id, children in by_parent.iteritems():
 
840
            if parent_id is ROOT_PARENT:
 
841
                continue
 
842
            if not self._any_contents(children):
 
843
                continue
 
844
            for child in children:
 
845
                try:
 
846
                    self.final_kind(child)
 
847
                except NoSuchFile:
 
848
                    continue
 
849
            try:
 
850
                kind = self.final_kind(parent_id)
 
851
            except NoSuchFile:
 
852
                kind = None
 
853
            if kind is None:
 
854
                conflicts.append(('missing parent', parent_id))
 
855
            elif kind != "directory":
 
856
                conflicts.append(('non-directory parent', parent_id))
 
857
        return conflicts
 
858
 
 
859
    def _any_contents(self, trans_ids):
 
860
        """Return true if any of the trans_ids, will have contents."""
 
861
        for trans_id in trans_ids:
 
862
            try:
 
863
                kind = self.final_kind(trans_id)
 
864
            except NoSuchFile:
 
865
                continue
 
866
            return True
 
867
        return False
 
868
 
 
869
    def _limbo_name(self, trans_id):
 
870
        """Generate the limbo name of a file"""
 
871
        limbo_name = self._limbo_files.get(trans_id)
 
872
        if limbo_name is not None:
 
873
            return limbo_name
 
874
        parent = self._new_parent.get(trans_id)
 
875
        # if the parent directory is already in limbo (e.g. when building a
 
876
        # tree), choose a limbo name inside the parent, to reduce further
 
877
        # renames.
 
878
        use_direct_path = False
 
879
        if self._new_contents.get(parent) == 'directory':
 
880
            filename = self._new_name.get(trans_id)
 
881
            if filename is not None:
 
882
                if parent not in self._limbo_children:
 
883
                    self._limbo_children[parent] = set()
 
884
                    self._limbo_children_names[parent] = {}
 
885
                    use_direct_path = True
 
886
                # the direct path can only be used if no other file has
 
887
                # already taken this pathname, i.e. if the name is unused, or
 
888
                # if it is already associated with this trans_id.
 
889
                elif self._case_sensitive_target:
 
890
                    if (self._limbo_children_names[parent].get(filename)
 
891
                        in (trans_id, None)):
 
892
                        use_direct_path = True
 
893
                else:
 
894
                    for l_filename, l_trans_id in\
 
895
                        self._limbo_children_names[parent].iteritems():
 
896
                        if l_trans_id == trans_id:
 
897
                            continue
 
898
                        if l_filename.lower() == filename.lower():
 
899
                            break
 
900
                    else:
 
901
                        use_direct_path = True
 
902
 
 
903
        if use_direct_path:
 
904
            limbo_name = pathjoin(self._limbo_files[parent], filename)
 
905
            self._limbo_children[parent].add(trans_id)
 
906
            self._limbo_children_names[parent][filename] = trans_id
 
907
        else:
 
908
            limbo_name = pathjoin(self._limbodir, trans_id)
 
909
            self._needs_rename.add(trans_id)
 
910
        self._limbo_files[trans_id] = limbo_name
 
911
        return limbo_name
 
912
 
 
913
    def _set_executability(self, path, trans_id):
 
914
        """Set the executability of versioned files """
 
915
        if supports_executable():
 
916
            new_executability = self._new_executability[trans_id]
 
917
            abspath = self._tree.abspath(path)
 
918
            current_mode = os.stat(abspath).st_mode
 
919
            if new_executability:
 
920
                umask = os.umask(0)
 
921
                os.umask(umask)
 
922
                to_mode = current_mode | (0100 & ~umask)
 
923
                # Enable x-bit for others only if they can read it.
 
924
                if current_mode & 0004:
 
925
                    to_mode |= 0001 & ~umask
 
926
                if current_mode & 0040:
 
927
                    to_mode |= 0010 & ~umask
 
928
            else:
 
929
                to_mode = current_mode & ~0111
 
930
            os.chmod(abspath, to_mode)
 
931
 
 
932
    def _new_entry(self, name, parent_id, file_id):
 
933
        """Helper function to create a new filesystem entry."""
 
934
        trans_id = self.create_path(name, parent_id)
 
935
        if file_id is not None:
 
936
            self.version_file(file_id, trans_id)
 
937
        return trans_id
 
938
 
 
939
    def new_file(self, name, parent_id, contents, file_id=None, 
 
940
                 executable=None):
 
941
        """Convenience method to create files.
 
942
        
 
943
        name is the name of the file to create.
 
944
        parent_id is the transaction id of the parent directory of the file.
 
945
        contents is an iterator of bytestrings, which will be used to produce
 
946
        the file.
 
947
        :param file_id: The inventory ID of the file, if it is to be versioned.
 
948
        :param executable: Only valid when a file_id has been supplied.
 
949
        """
 
950
        trans_id = self._new_entry(name, parent_id, file_id)
 
951
        # TODO: rather than scheduling a set_executable call,
 
952
        # have create_file create the file with the right mode.
 
953
        self.create_file(contents, trans_id)
 
954
        if executable is not None:
 
955
            self.set_executability(executable, trans_id)
 
956
        return trans_id
 
957
 
 
958
    def new_directory(self, name, parent_id, file_id=None):
 
959
        """Convenience method to create directories.
 
960
 
 
961
        name is the name of the directory to create.
 
962
        parent_id is the transaction id of the parent directory of the
 
963
        directory.
 
964
        file_id is the inventory ID of the directory, if it is to be versioned.
 
965
        """
 
966
        trans_id = self._new_entry(name, parent_id, file_id)
 
967
        self.create_directory(trans_id)
 
968
        return trans_id 
 
969
 
 
970
    def new_symlink(self, name, parent_id, target, file_id=None):
 
971
        """Convenience method to create symbolic link.
 
972
        
 
973
        name is the name of the symlink to create.
 
974
        parent_id is the transaction id of the parent directory of the symlink.
 
975
        target is a bytestring of the target of the symlink.
 
976
        file_id is the inventory ID of the file, if it is to be versioned.
 
977
        """
 
978
        trans_id = self._new_entry(name, parent_id, file_id)
 
979
        self.create_symlink(target, trans_id)
 
980
        return trans_id
 
981
 
 
982
    def _affected_ids(self):
 
983
        """Return the set of transform ids affected by the transform"""
 
984
        trans_ids = set(self._removed_id)
 
985
        trans_ids.update(self._new_id.keys())
 
986
        trans_ids.update(self._removed_contents)
 
987
        trans_ids.update(self._new_contents.keys())
 
988
        trans_ids.update(self._new_executability.keys())
 
989
        trans_ids.update(self._new_name.keys())
 
990
        trans_ids.update(self._new_parent.keys())
 
991
        return trans_ids
 
992
 
 
993
    def _get_file_id_maps(self):
 
994
        """Return mapping of file_ids to trans_ids in the to and from states"""
 
995
        trans_ids = self._affected_ids()
 
996
        from_trans_ids = {}
 
997
        to_trans_ids = {}
 
998
        # Build up two dicts: trans_ids associated with file ids in the
 
999
        # FROM state, vs the TO state.
 
1000
        for trans_id in trans_ids:
 
1001
            from_file_id = self.tree_file_id(trans_id)
 
1002
            if from_file_id is not None:
 
1003
                from_trans_ids[from_file_id] = trans_id
 
1004
            to_file_id = self.final_file_id(trans_id)
 
1005
            if to_file_id is not None:
 
1006
                to_trans_ids[to_file_id] = trans_id
 
1007
        return from_trans_ids, to_trans_ids
 
1008
 
 
1009
    def _from_file_data(self, from_trans_id, from_versioned, file_id):
 
1010
        """Get data about a file in the from (tree) state
 
1011
 
 
1012
        Return a (name, parent, kind, executable) tuple
 
1013
        """
 
1014
        from_path = self._tree_id_paths.get(from_trans_id)
 
1015
        if from_versioned:
 
1016
            # get data from working tree if versioned
 
1017
            from_entry = self._tree.iter_entries_by_dir([file_id]).next()[1]
 
1018
            from_name = from_entry.name
 
1019
            from_parent = from_entry.parent_id
 
1020
        else:
 
1021
            from_entry = None
 
1022
            if from_path is None:
 
1023
                # File does not exist in FROM state
 
1024
                from_name = None
 
1025
                from_parent = None
 
1026
            else:
 
1027
                # File exists, but is not versioned.  Have to use path-
 
1028
                # splitting stuff
 
1029
                from_name = os.path.basename(from_path)
 
1030
                tree_parent = self.get_tree_parent(from_trans_id)
 
1031
                from_parent = self.tree_file_id(tree_parent)
 
1032
        if from_path is not None:
 
1033
            from_kind, from_executable, from_stats = \
 
1034
                self._tree._comparison_data(from_entry, from_path)
 
1035
        else:
 
1036
            from_kind = None
 
1037
            from_executable = False
 
1038
        return from_name, from_parent, from_kind, from_executable
 
1039
 
 
1040
    def _to_file_data(self, to_trans_id, from_trans_id, from_executable):
 
1041
        """Get data about a file in the to (target) state
 
1042
 
 
1043
        Return a (name, parent, kind, executable) tuple
 
1044
        """
 
1045
        to_name = self.final_name(to_trans_id)
 
1046
        try:
 
1047
            to_kind = self.final_kind(to_trans_id)
 
1048
        except NoSuchFile:
 
1049
            to_kind = None
 
1050
        to_parent = self.final_file_id(self.final_parent(to_trans_id))
 
1051
        if to_trans_id in self._new_executability:
 
1052
            to_executable = self._new_executability[to_trans_id]
 
1053
        elif to_trans_id == from_trans_id:
 
1054
            to_executable = from_executable
 
1055
        else:
 
1056
            to_executable = False
 
1057
        return to_name, to_parent, to_kind, to_executable
 
1058
 
 
1059
    def iter_changes(self):
 
1060
        """Produce output in the same format as Tree.iter_changes.
 
1061
 
 
1062
        Will produce nonsensical results if invoked while inventory/filesystem
 
1063
        conflicts (as reported by TreeTransform.find_conflicts()) are present.
 
1064
 
 
1065
        This reads the Transform, but only reproduces changes involving a
 
1066
        file_id.  Files that are not versioned in either of the FROM or TO
 
1067
        states are not reflected.
 
1068
        """
 
1069
        final_paths = FinalPaths(self)
 
1070
        from_trans_ids, to_trans_ids = self._get_file_id_maps()
 
1071
        results = []
 
1072
        # Now iterate through all active file_ids
 
1073
        for file_id in set(from_trans_ids.keys() + to_trans_ids.keys()):
 
1074
            modified = False
 
1075
            from_trans_id = from_trans_ids.get(file_id)
 
1076
            # find file ids, and determine versioning state
 
1077
            if from_trans_id is None:
 
1078
                from_versioned = False
 
1079
                from_trans_id = to_trans_ids[file_id]
 
1080
            else:
 
1081
                from_versioned = True
 
1082
            to_trans_id = to_trans_ids.get(file_id)
 
1083
            if to_trans_id is None:
 
1084
                to_versioned = False
 
1085
                to_trans_id = from_trans_id
 
1086
            else:
 
1087
                to_versioned = True
 
1088
 
 
1089
            from_name, from_parent, from_kind, from_executable = \
 
1090
                self._from_file_data(from_trans_id, from_versioned, file_id)
 
1091
 
 
1092
            to_name, to_parent, to_kind, to_executable = \
 
1093
                self._to_file_data(to_trans_id, from_trans_id, from_executable)
 
1094
 
 
1095
            if not from_versioned:
 
1096
                from_path = None
 
1097
            else:
 
1098
                from_path = self._tree_id_paths.get(from_trans_id)
 
1099
            if not to_versioned:
 
1100
                to_path = None
 
1101
            else:
 
1102
                to_path = final_paths.get_path(to_trans_id)
 
1103
            if from_kind != to_kind:
 
1104
                modified = True
 
1105
            elif to_kind in ('file', 'symlink') and (
 
1106
                to_trans_id != from_trans_id or
 
1107
                to_trans_id in self._new_contents):
 
1108
                modified = True
 
1109
            if (not modified and from_versioned == to_versioned and
 
1110
                from_parent==to_parent and from_name == to_name and
 
1111
                from_executable == to_executable):
 
1112
                continue
 
1113
            results.append((file_id, (from_path, to_path), modified,
 
1114
                   (from_versioned, to_versioned),
 
1115
                   (from_parent, to_parent),
 
1116
                   (from_name, to_name),
 
1117
                   (from_kind, to_kind),
 
1118
                   (from_executable, to_executable)))
 
1119
        return iter(sorted(results, key=lambda x:x[1]))
 
1120
 
 
1121
    def get_preview_tree(self):
 
1122
        """Return a tree representing the result of the transform.
 
1123
 
 
1124
        This tree only supports the subset of Tree functionality required
 
1125
        by show_diff_trees.  It must only be compared to tt._tree.
 
1126
        """
 
1127
        return _PreviewTree(self)
 
1128
 
 
1129
    def _text_parent(self, trans_id):
 
1130
        file_id = self.tree_file_id(trans_id)
 
1131
        try:
 
1132
            if file_id is None or self._tree.kind(file_id) != 'file':
 
1133
                return None
 
1134
        except errors.NoSuchFile:
 
1135
            return None
 
1136
        return file_id
 
1137
 
 
1138
    def _get_parents_texts(self, trans_id):
 
1139
        """Get texts for compression parents of this file."""
 
1140
        file_id = self._text_parent(trans_id)
 
1141
        if file_id is None:
 
1142
            return ()
 
1143
        return (self._tree.get_file_text(file_id),)
 
1144
 
 
1145
    def _get_parents_lines(self, trans_id):
 
1146
        """Get lines for compression parents of this file."""
 
1147
        file_id = self._text_parent(trans_id)
 
1148
        if file_id is None:
 
1149
            return ()
 
1150
        return (self._tree.get_file_lines(file_id),)
 
1151
 
 
1152
    def serialize(self, serializer):
 
1153
        """Serialize this TreeTransform.
 
1154
 
 
1155
        :param serializer: A Serialiser like pack.ContainerSerializer.
 
1156
        """
 
1157
        new_name = dict((k, v.encode('utf-8')) for k, v in
 
1158
                        self._new_name.items())
 
1159
        new_executability = dict((k, int(v)) for k, v in
 
1160
                                 self._new_executability.items())
 
1161
        tree_path_ids = dict((k.encode('utf-8'), v)
 
1162
                             for k, v in self._tree_path_ids.items())
 
1163
        attribs = {
 
1164
            '_id_number': self._id_number,
 
1165
            '_new_name': new_name,
 
1166
            '_new_parent': self._new_parent,
 
1167
            '_new_executability': new_executability,
 
1168
            '_new_id': self._new_id,
 
1169
            '_tree_path_ids': tree_path_ids,
 
1170
            '_removed_id': list(self._removed_id),
 
1171
            '_removed_contents': list(self._removed_contents),
 
1172
            '_non_present_ids': self._non_present_ids,
 
1173
            }
 
1174
        yield serializer.bytes_record(bencode.bencode(attribs),
 
1175
                                      (('attribs',),))
 
1176
        for trans_id, kind in self._new_contents.items():
 
1177
            if kind == 'file':
 
1178
                cur_file = open(self._limbo_name(trans_id), 'rb')
 
1179
                try:
 
1180
                    lines = osutils.chunks_to_lines(cur_file.readlines())
 
1181
                finally:
 
1182
                    cur_file.close()
 
1183
                parents = self._get_parents_lines(trans_id)
 
1184
                mpdiff = multiparent.MultiParent.from_lines(lines, parents)
 
1185
                content = ''.join(mpdiff.to_patch())
 
1186
            if kind == 'directory':
 
1187
                content = ''
 
1188
            if kind == 'symlink':
 
1189
                content = os.readlink(self._limbo_name(trans_id))
 
1190
            yield serializer.bytes_record(content, ((trans_id, kind),))
 
1191
 
 
1192
 
 
1193
    def deserialize(self, records):
 
1194
        """Deserialize a stored TreeTransform.
 
1195
 
 
1196
        :param records: An iterable of (names, content) tuples, as per
 
1197
            pack.ContainerPushParser.
 
1198
        """
 
1199
        names, content = records.next()
 
1200
        attribs = bencode.bdecode(content)
 
1201
        self._id_number = attribs['_id_number']
 
1202
        self._new_name = dict((k, v.decode('utf-8'))
 
1203
                            for k, v in attribs['_new_name'].items())
 
1204
        self._new_parent = attribs['_new_parent']
 
1205
        self._new_executability = dict((k, bool(v)) for k, v in
 
1206
            attribs['_new_executability'].items())
 
1207
        self._new_id = attribs['_new_id']
 
1208
        self._r_new_id = dict((v, k) for k, v in self._new_id.items())
 
1209
        self._tree_path_ids = {}
 
1210
        self._tree_id_paths = {}
 
1211
        for bytepath, trans_id in attribs['_tree_path_ids'].items():
 
1212
            path = bytepath.decode('utf-8')
 
1213
            self._tree_path_ids[path] = trans_id
 
1214
            self._tree_id_paths[trans_id] = path
 
1215
        self._removed_id = set(attribs['_removed_id'])
 
1216
        self._removed_contents = set(attribs['_removed_contents'])
 
1217
        self._non_present_ids = attribs['_non_present_ids']
 
1218
        for ((trans_id, kind),), content in records:
 
1219
            if kind == 'file':
 
1220
                mpdiff = multiparent.MultiParent.from_patch(content)
 
1221
                lines = mpdiff.to_lines(self._get_parents_texts(trans_id))
 
1222
                self.create_file(lines, trans_id)
 
1223
            if kind == 'directory':
 
1224
                self.create_directory(trans_id)
 
1225
            if kind == 'symlink':
 
1226
                self.create_symlink(content.decode('utf-8'), trans_id)
 
1227
 
 
1228
 
 
1229
class TreeTransform(TreeTransformBase):
 
1230
    """Represent a tree transformation.
 
1231
 
 
1232
    This object is designed to support incremental generation of the transform,
 
1233
    in any order.
 
1234
 
 
1235
    However, it gives optimum performance when parent directories are created
 
1236
    before their contents.  The transform is then able to put child files
 
1237
    directly in their parent directory, avoiding later renames.
 
1238
 
 
1239
    It is easy to produce malformed transforms, but they are generally
 
1240
    harmless.  Attempting to apply a malformed transform will cause an
 
1241
    exception to be raised before any modifications are made to the tree.
 
1242
 
 
1243
    Many kinds of malformed transforms can be corrected with the
 
1244
    resolve_conflicts function.  The remaining ones indicate programming error,
 
1245
    such as trying to create a file with no path.
 
1246
 
 
1247
    Two sets of file creation methods are supplied.  Convenience methods are:
 
1248
     * new_file
 
1249
     * new_directory
 
1250
     * new_symlink
 
1251
 
 
1252
    These are composed of the low-level methods:
 
1253
     * create_path
 
1254
     * create_file or create_directory or create_symlink
 
1255
     * version_file
 
1256
     * set_executability
 
1257
 
 
1258
    Transform/Transaction ids
 
1259
    -------------------------
 
1260
    trans_ids are temporary ids assigned to all files involved in a transform.
 
1261
    It's possible, even common, that not all files in the Tree have trans_ids.
 
1262
 
 
1263
    trans_ids are used because filenames and file_ids are not good enough
 
1264
    identifiers; filenames change, and not all files have file_ids.  File-ids
 
1265
    are also associated with trans-ids, so that moving a file moves its
 
1266
    file-id.
 
1267
 
 
1268
    trans_ids are only valid for the TreeTransform that generated them.
 
1269
 
 
1270
    Limbo
 
1271
    -----
 
1272
    Limbo is a temporary directory used to hold new versions of files.
 
1273
    Files are added to limbo by create_file, create_directory, create_symlink,
 
1274
    and their convenience variants (new_*).  Files may be removed from limbo
 
1275
    using cancel_creation.  Files are renamed from limbo into their final
 
1276
    location as part of TreeTransform.apply
 
1277
 
 
1278
    Limbo must be cleaned up, by either calling TreeTransform.apply or
 
1279
    calling TreeTransform.finalize.
 
1280
 
 
1281
    Files are placed into limbo inside their parent directories, where
 
1282
    possible.  This reduces subsequent renames, and makes operations involving
 
1283
    lots of files faster.  This optimization is only possible if the parent
 
1284
    directory is created *before* creating any of its children, so avoid
 
1285
    creating children before parents, where possible.
 
1286
 
 
1287
    Pending-deletion
 
1288
    ----------------
 
1289
    This temporary directory is used by _FileMover for storing files that are
 
1290
    about to be deleted.  In case of rollback, the files will be restored.
 
1291
    FileMover does not delete files until it is sure that a rollback will not
 
1292
    happen.
 
1293
    """
 
1294
    def __init__(self, tree, pb=DummyProgress()):
 
1295
        """Note: a tree_write lock is taken on the tree.
 
1296
 
 
1297
        Use TreeTransform.finalize() to release the lock (can be omitted if
 
1298
        TreeTransform.apply() called).
 
1299
        """
 
1300
        tree.lock_tree_write()
 
1301
 
 
1302
        try:
 
1303
            limbodir = urlutils.local_path_from_url(
 
1304
                tree._transport.abspath('limbo'))
 
1305
            try:
 
1306
                os.mkdir(limbodir)
 
1307
            except OSError, e:
 
1308
                if e.errno == errno.EEXIST:
 
1309
                    raise ExistingLimbo(limbodir)
 
1310
            deletiondir = urlutils.local_path_from_url(
 
1311
                tree._transport.abspath('pending-deletion'))
 
1312
            try:
 
1313
                os.mkdir(deletiondir)
 
1314
            except OSError, e:
 
1315
                if e.errno == errno.EEXIST:
 
1316
                    raise errors.ExistingPendingDeletion(deletiondir)
 
1317
        except:
 
1318
            tree.unlock()
 
1319
            raise
 
1320
 
 
1321
        TreeTransformBase.__init__(self, tree, limbodir, pb,
 
1322
                                   tree.case_sensitive)
 
1323
        self._deletiondir = deletiondir
 
1324
 
 
1325
    def apply(self, no_conflicts=False, precomputed_delta=None, _mover=None):
 
1326
        """Apply all changes to the inventory and filesystem.
 
1327
 
 
1328
        If filesystem or inventory conflicts are present, MalformedTransform
 
1329
        will be thrown.
 
1330
 
 
1331
        If apply succeeds, finalize is not necessary.
 
1332
 
 
1333
        :param no_conflicts: if True, the caller guarantees there are no
 
1334
            conflicts, so no check is made.
 
1335
        :param precomputed_delta: An inventory delta to use instead of
 
1336
            calculating one.
 
1337
        :param _mover: Supply an alternate FileMover, for testing
 
1338
        """
 
1339
        if not no_conflicts:
 
1340
            conflicts = self.find_conflicts()
 
1341
            if len(conflicts) != 0:
 
1342
                raise MalformedTransform(conflicts=conflicts)
 
1343
        child_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
1344
        try:
 
1345
            if precomputed_delta is None:
 
1346
                child_pb.update('Apply phase', 0, 2)
 
1347
                inventory_delta = self._generate_inventory_delta()
 
1348
                offset = 1
 
1349
            else:
 
1350
                inventory_delta = precomputed_delta
 
1351
                offset = 0
 
1352
            if _mover is None:
 
1353
                mover = _FileMover()
 
1354
            else:
 
1355
                mover = _mover
 
1356
            try:
 
1357
                child_pb.update('Apply phase', 0 + offset, 2 + offset)
 
1358
                self._apply_removals(mover)
 
1359
                child_pb.update('Apply phase', 1 + offset, 2 + offset)
 
1360
                modified_paths = self._apply_insertions(mover)
 
1361
            except:
 
1362
                mover.rollback()
 
1363
                raise
 
1364
            else:
 
1365
                mover.apply_deletions()
 
1366
        finally:
 
1367
            child_pb.finished()
 
1368
        self._tree.apply_inventory_delta(inventory_delta)
 
1369
        self._done = True
 
1370
        self.finalize()
 
1371
        return _TransformResults(modified_paths, self.rename_count)
 
1372
 
 
1373
    def _generate_inventory_delta(self):
 
1374
        """Generate an inventory delta for the current transform."""
 
1375
        inventory_delta = []
 
1376
        child_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
1377
        new_paths = self._inventory_altered()
 
1378
        total_entries = len(new_paths) + len(self._removed_id)
 
1379
        try:
 
1380
            for num, trans_id in enumerate(self._removed_id):
 
1381
                if (num % 10) == 0:
 
1382
                    child_pb.update('removing file', num, total_entries)
 
1383
                if trans_id == self._new_root:
 
1384
                    file_id = self._tree.get_root_id()
 
1385
                else:
 
1386
                    file_id = self.tree_file_id(trans_id)
 
1387
                # File-id isn't really being deleted, just moved
 
1388
                if file_id in self._r_new_id:
 
1389
                    continue
 
1390
                path = self._tree_id_paths[trans_id]
 
1391
                inventory_delta.append((path, None, file_id, None))
 
1392
            new_path_file_ids = dict((t, self.final_file_id(t)) for p, t in
 
1393
                                     new_paths)
 
1394
            entries = self._tree.iter_entries_by_dir(
 
1395
                new_path_file_ids.values())
 
1396
            old_paths = dict((e.file_id, p) for p, e in entries)
 
1397
            final_kinds = {}
 
1398
            for num, (path, trans_id) in enumerate(new_paths):
 
1399
                if (num % 10) == 0:
 
1400
                    child_pb.update('adding file',
 
1401
                                    num + len(self._removed_id), total_entries)
 
1402
                file_id = new_path_file_ids[trans_id]
 
1403
                if file_id is None:
 
1404
                    continue
 
1405
                needs_entry = False
 
1406
                try:
 
1407
                    kind = self.final_kind(trans_id)
 
1408
                except NoSuchFile:
 
1409
                    kind = self._tree.stored_kind(file_id)
 
1410
                parent_trans_id = self.final_parent(trans_id)
 
1411
                parent_file_id = new_path_file_ids.get(parent_trans_id)
 
1412
                if parent_file_id is None:
 
1413
                    parent_file_id = self.final_file_id(parent_trans_id)
 
1414
                if trans_id in self._new_reference_revision:
 
1415
                    new_entry = inventory.TreeReference(
 
1416
                        file_id,
 
1417
                        self._new_name[trans_id],
 
1418
                        self.final_file_id(self._new_parent[trans_id]),
 
1419
                        None, self._new_reference_revision[trans_id])
 
1420
                else:
 
1421
                    new_entry = inventory.make_entry(kind,
 
1422
                        self.final_name(trans_id),
 
1423
                        parent_file_id, file_id)
 
1424
                old_path = old_paths.get(new_entry.file_id)
 
1425
                new_executability = self._new_executability.get(trans_id)
 
1426
                if new_executability is not None:
 
1427
                    new_entry.executable = new_executability
 
1428
                inventory_delta.append(
 
1429
                    (old_path, path, new_entry.file_id, new_entry))
 
1430
        finally:
 
1431
            child_pb.finished()
 
1432
        return inventory_delta
 
1433
 
 
1434
    def _apply_removals(self, mover):
 
1435
        """Perform tree operations that remove directory/inventory names.
 
1436
 
 
1437
        That is, delete files that are to be deleted, and put any files that
 
1438
        need renaming into limbo.  This must be done in strict child-to-parent
 
1439
        order.
 
1440
 
 
1441
        If inventory_delta is None, no inventory delta generation is performed.
 
1442
        """
 
1443
        tree_paths = list(self._tree_path_ids.iteritems())
 
1444
        tree_paths.sort(reverse=True)
 
1445
        child_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
1446
        try:
 
1447
            for num, data in enumerate(tree_paths):
 
1448
                path, trans_id = data
 
1449
                child_pb.update('removing file', num, len(tree_paths))
 
1450
                full_path = self._tree.abspath(path)
 
1451
                if trans_id in self._removed_contents:
 
1452
                    mover.pre_delete(full_path, os.path.join(self._deletiondir,
 
1453
                                     trans_id))
 
1454
                elif trans_id in self._new_name or trans_id in \
 
1455
                    self._new_parent:
 
1456
                    try:
 
1457
                        mover.rename(full_path, self._limbo_name(trans_id))
 
1458
                    except OSError, e:
 
1459
                        if e.errno != errno.ENOENT:
 
1460
                            raise
 
1461
                    else:
 
1462
                        self.rename_count += 1
 
1463
        finally:
 
1464
            child_pb.finished()
 
1465
 
 
1466
    def _apply_insertions(self, mover):
 
1467
        """Perform tree operations that insert directory/inventory names.
 
1468
 
 
1469
        That is, create any files that need to be created, and restore from
 
1470
        limbo any files that needed renaming.  This must be done in strict
 
1471
        parent-to-child order.
 
1472
 
 
1473
        If inventory_delta is None, no inventory delta is calculated, and
 
1474
        no list of modified paths is returned.
 
1475
        """
 
1476
        new_paths = self.new_paths(filesystem_only=True)
 
1477
        modified_paths = []
 
1478
        new_path_file_ids = dict((t, self.final_file_id(t)) for p, t in
 
1479
                                 new_paths)
 
1480
        child_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
1481
        try:
 
1482
            for num, (path, trans_id) in enumerate(new_paths):
 
1483
                if (num % 10) == 0:
 
1484
                    child_pb.update('adding file', num, len(new_paths))
 
1485
                full_path = self._tree.abspath(path)
 
1486
                if trans_id in self._needs_rename:
 
1487
                    try:
 
1488
                        mover.rename(self._limbo_name(trans_id), full_path)
 
1489
                    except OSError, e:
 
1490
                        # We may be renaming a dangling inventory id
 
1491
                        if e.errno != errno.ENOENT:
 
1492
                            raise
 
1493
                    else:
 
1494
                        self.rename_count += 1
 
1495
                if (trans_id in self._new_contents or
 
1496
                    self.path_changed(trans_id)):
 
1497
                    if trans_id in self._new_contents:
 
1498
                        modified_paths.append(full_path)
 
1499
                if trans_id in self._new_executability:
 
1500
                    self._set_executability(path, trans_id)
 
1501
        finally:
 
1502
            child_pb.finished()
 
1503
        self._new_contents.clear()
 
1504
        return modified_paths
 
1505
 
 
1506
 
 
1507
class TransformPreview(TreeTransformBase):
    """A TreeTransform for generating preview trees.

    Unlike TreeTransform, this version works when the input tree is a
    RevisionTree, rather than a WorkingTree.  As a result, it tends to ignore
    unversioned files in the input tree.
    """

    def __init__(self, tree, pb=DummyProgress(), case_sensitive=True):
        """Read-lock tree and create a temporary limbo directory for it.

        :param tree: The tree the preview is based on.
        :param pb: Progress bar, passed through to TreeTransformBase.
        :param case_sensitive: Passed through to TreeTransformBase.
        """
        tree.lock_read()
        try:
            limbodir = osutils.mkdtemp(prefix='bzr-limbo-')
        except:
            # Don't leave the tree locked if the limbo directory can't be
            # created.
            tree.unlock()
            raise
        TreeTransformBase.__init__(self, tree, limbodir, pb, case_sensitive)

    def canonical_path(self, path):
        """Return path unchanged."""
        return path

    def tree_kind(self, trans_id):
        """Return the kind that trans_id has in the input tree.

        :raises NoSuchFile: if trans_id has no path in the input tree.
        """
        path = self._tree_id_paths.get(trans_id)
        if path is None:
            raise NoSuchFile(None)
        file_id = self._tree.path2id(path)
        return self._tree.kind(file_id)

    def _set_mode(self, trans_id, mode_id, typefunc):
        """Set the mode of new file contents.

        The mode_id is the existing file to get the mode from (often the same
        as trans_id).  The operation is only performed if there's a mode match
        according to typefunc.

        This implementation deliberately does nothing.
        """
        # is it ok to ignore this?  probably
        pass

    def iter_tree_children(self, parent_id):
        """Iterate through the entry's tree children, if any

        Yields a trans_id for each child that the input tree's entry for
        parent_id has.  Nothing is yielded if parent_id has no tree path or
        no file id in the tree.
        """
        try:
            path = self._tree_id_paths[parent_id]
        except KeyError:
            return
        file_id = self.tree_file_id(parent_id)
        if file_id is None:
            return
        entry = self._tree.iter_entries_by_dir([file_id]).next()[1]
        # Only some entries have a 'children' attribute; treat the others as
        # having no children.
        children = getattr(entry, 'children', {})
        for child in children:
            childpath = joinpath(path, child)
            yield self.trans_id_tree_path(childpath)
 
1553
 
 
1554
 
 
1555
class _PreviewTree(tree.Tree):
 
1556
    """Partial implementation of Tree to support show_diff_trees"""
 
1557
 
 
1558
    def __init__(self, transform):
 
1559
        self._transform = transform
 
1560
        self._final_paths = FinalPaths(transform)
 
1561
        self.__by_parent = None
 
1562
        self._parent_ids = []
 
1563
        self._all_children_cache = {}
 
1564
        self._path2trans_id_cache = {}
 
1565
        self._final_name_cache = {}
 
1566
 
 
1567
    def _changes(self, file_id):
 
1568
        for changes in self._transform.iter_changes():
 
1569
            if changes[0] == file_id:
 
1570
                return changes
 
1571
 
 
1572
    def _content_change(self, file_id):
 
1573
        """Return True if the content of this file changed"""
 
1574
        changes = self._changes(file_id)
 
1575
        # changes[2] is true if the file content changed.  See
 
1576
        # InterTree.iter_changes.
 
1577
        return (changes is not None and changes[2])
 
1578
 
 
1579
    def _get_repository(self):
 
1580
        repo = getattr(self._transform._tree, '_repository', None)
 
1581
        if repo is None:
 
1582
            repo = self._transform._tree.branch.repository
 
1583
        return repo
 
1584
 
 
1585
    def _iter_parent_trees(self):
 
1586
        for revision_id in self.get_parent_ids():
 
1587
            try:
 
1588
                yield self.revision_tree(revision_id)
 
1589
            except errors.NoSuchRevisionInTree:
 
1590
                yield self._get_repository().revision_tree(revision_id)
 
1591
 
 
1592
    def _get_file_revision(self, file_id, vf, tree_revision):
 
1593
        parent_keys = [(file_id, self._file_revision(t, file_id)) for t in
 
1594
                       self._iter_parent_trees()]
 
1595
        vf.add_lines((file_id, tree_revision), parent_keys,
 
1596
                     self.get_file(file_id).readlines())
 
1597
        repo = self._get_repository()
 
1598
        base_vf = repo.texts
 
1599
        if base_vf not in vf.fallback_versionedfiles:
 
1600
            vf.fallback_versionedfiles.append(base_vf)
 
1601
        return tree_revision
 
1602
 
 
1603
    def _stat_limbo_file(self, file_id):
 
1604
        trans_id = self._transform.trans_id_file_id(file_id)
 
1605
        name = self._transform._limbo_name(trans_id)
 
1606
        return os.lstat(name)
 
1607
 
 
1608
    @property
 
1609
    def _by_parent(self):
 
1610
        if self.__by_parent is None:
 
1611
            self.__by_parent = self._transform.by_parent()
 
1612
        return self.__by_parent
 
1613
 
 
1614
    def _comparison_data(self, entry, path):
 
1615
        kind, size, executable, link_or_sha1 = self.path_content_summary(path)
 
1616
        if kind == 'missing':
 
1617
            kind = None
 
1618
            executable = False
 
1619
        else:
 
1620
            file_id = self._transform.final_file_id(self._path2trans_id(path))
 
1621
            executable = self.is_executable(file_id, path)
 
1622
        return kind, executable, None
 
1623
 
 
1624
    def lock_read(self):
 
1625
        # Perhaps in theory, this should lock the TreeTransform?
 
1626
        pass
 
1627
 
 
1628
    def unlock(self):
 
1629
        pass
 
1630
 
 
1631
    @property
 
1632
    def inventory(self):
 
1633
        """This Tree does not use inventory as its backing data."""
 
1634
        raise NotImplementedError(_PreviewTree.inventory)
 
1635
 
 
1636
    def get_root_id(self):
 
1637
        return self._transform.final_file_id(self._transform.root)
 
1638
 
 
1639
    def all_file_ids(self):
 
1640
        tree_ids = set(self._transform._tree.all_file_ids())
 
1641
        tree_ids.difference_update(self._transform.tree_file_id(t)
 
1642
                                   for t in self._transform._removed_id)
 
1643
        tree_ids.update(self._transform._new_id.values())
 
1644
        return tree_ids
 
1645
 
 
1646
    def __iter__(self):
 
1647
        return iter(self.all_file_ids())
 
1648
 
 
1649
    def has_id(self, file_id):
 
1650
        if file_id in self._transform._r_new_id:
 
1651
            return True
 
1652
        elif file_id in set([self._transform.tree_file_id(trans_id) for
 
1653
            trans_id in self._transform._removed_id]):
 
1654
            return False
 
1655
        else:
 
1656
            return self._transform._tree.has_id(file_id)
 
1657
 
 
1658
    def _path2trans_id(self, path):
 
1659
        # We must not use None here, because that is a valid value to store.
 
1660
        trans_id = self._path2trans_id_cache.get(path, object)
 
1661
        if trans_id is not object:
 
1662
            return trans_id
 
1663
        segments = splitpath(path)
 
1664
        cur_parent = self._transform.root
 
1665
        for cur_segment in segments:
 
1666
            for child in self._all_children(cur_parent):
 
1667
                final_name = self._final_name_cache.get(child)
 
1668
                if final_name is None:
 
1669
                    final_name = self._transform.final_name(child)
 
1670
                    self._final_name_cache[child] = final_name
 
1671
                if final_name == cur_segment:
 
1672
                    cur_parent = child
 
1673
                    break
 
1674
            else:
 
1675
                self._path2trans_id_cache[path] = None
 
1676
                return None
 
1677
        self._path2trans_id_cache[path] = cur_parent
 
1678
        return cur_parent
 
1679
 
 
1680
    def path2id(self, path):
 
1681
        return self._transform.final_file_id(self._path2trans_id(path))
 
1682
 
 
1683
    def id2path(self, file_id):
 
1684
        trans_id = self._transform.trans_id_file_id(file_id)
 
1685
        try:
 
1686
            return self._final_paths._determine_path(trans_id)
 
1687
        except NoFinalPath:
 
1688
            raise errors.NoSuchId(self, file_id)
 
1689
 
 
1690
    def _all_children(self, trans_id):
 
1691
        children = self._all_children_cache.get(trans_id)
 
1692
        if children is not None:
 
1693
            return children
 
1694
        children = set(self._transform.iter_tree_children(trans_id))
 
1695
        # children in the _new_parent set are provided by _by_parent.
 
1696
        children.difference_update(self._transform._new_parent.keys())
 
1697
        children.update(self._by_parent.get(trans_id, []))
 
1698
        self._all_children_cache[trans_id] = children
 
1699
        return children
 
1700
 
 
1701
    def iter_children(self, file_id):
 
1702
        trans_id = self._transform.trans_id_file_id(file_id)
 
1703
        for child_trans_id in self._all_children(trans_id):
 
1704
            yield self._transform.final_file_id(child_trans_id)
 
1705
 
 
1706
    def extras(self):
 
1707
        possible_extras = set(self._transform.trans_id_tree_path(p) for p
 
1708
                              in self._transform._tree.extras())
 
1709
        possible_extras.update(self._transform._new_contents)
 
1710
        possible_extras.update(self._transform._removed_id)
 
1711
        for trans_id in possible_extras:
 
1712
            if self._transform.final_file_id(trans_id) is None:
 
1713
                yield self._final_paths._determine_path(trans_id)
 
1714
 
 
1715
    def _make_inv_entries(self, ordered_entries, specific_file_ids):
 
1716
        for trans_id, parent_file_id in ordered_entries:
 
1717
            file_id = self._transform.final_file_id(trans_id)
 
1718
            if file_id is None:
 
1719
                continue
 
1720
            if (specific_file_ids is not None
 
1721
                and file_id not in specific_file_ids):
 
1722
                continue
 
1723
            try:
 
1724
                kind = self._transform.final_kind(trans_id)
 
1725
            except NoSuchFile:
 
1726
                kind = self._transform._tree.stored_kind(file_id)
 
1727
            new_entry = inventory.make_entry(
 
1728
                kind,
 
1729
                self._transform.final_name(trans_id),
 
1730
                parent_file_id, file_id)
 
1731
            yield new_entry, trans_id
 
1732
 
 
1733
    def _list_files_by_dir(self):
 
1734
        todo = [ROOT_PARENT]
 
1735
        ordered_ids = []
 
1736
        while len(todo) > 0:
 
1737
            parent = todo.pop()
 
1738
            parent_file_id = self._transform.final_file_id(parent)
 
1739
            children = list(self._all_children(parent))
 
1740
            paths = dict(zip(children, self._final_paths.get_paths(children)))
 
1741
            children.sort(key=paths.get)
 
1742
            todo.extend(reversed(children))
 
1743
            for trans_id in children:
 
1744
                ordered_ids.append((trans_id, parent_file_id))
 
1745
        return ordered_ids
 
1746
 
 
1747
    def iter_entries_by_dir(self, specific_file_ids=None):
 
1748
        # This may not be a maximally efficient implementation, but it is
 
1749
        # reasonably straightforward.  An implementation that grafts the
 
1750
        # TreeTransform changes onto the tree's iter_entries_by_dir results
 
1751
        # might be more efficient, but requires tricky inferences about stack
 
1752
        # position.
 
1753
        ordered_ids = self._list_files_by_dir()
 
1754
        for entry, trans_id in self._make_inv_entries(ordered_ids,
 
1755
                                                      specific_file_ids):
 
1756
            yield unicode(self._final_paths.get_path(trans_id)), entry
 
1757
 
 
1758
    def list_files(self, include_root=False):
 
1759
        """See Tree.list_files."""
 
1760
        # XXX This should behave like WorkingTree.list_files, but is really
 
1761
        # more like RevisionTree.list_files.
 
1762
        for path, entry in self.iter_entries_by_dir():
 
1763
            if entry.name == '' and not include_root:
 
1764
                continue
 
1765
            yield path, 'V', entry.kind, entry.file_id, entry
 
1766
 
 
1767
    def kind(self, file_id):
 
1768
        trans_id = self._transform.trans_id_file_id(file_id)
 
1769
        return self._transform.final_kind(trans_id)
 
1770
 
 
1771
    def stored_kind(self, file_id):
 
1772
        trans_id = self._transform.trans_id_file_id(file_id)
 
1773
        try:
 
1774
            return self._transform._new_contents[trans_id]
 
1775
        except KeyError:
 
1776
            return self._transform._tree.stored_kind(file_id)
 
1777
 
 
1778
    def get_file_mtime(self, file_id, path=None):
 
1779
        """See Tree.get_file_mtime"""
 
1780
        if not self._content_change(file_id):
 
1781
            return self._transform._tree.get_file_mtime(file_id, path)
 
1782
        return self._stat_limbo_file(file_id).st_mtime
 
1783
 
 
1784
    def _file_size(self, entry, stat_value):
 
1785
        return self.get_file_size(entry.file_id)
 
1786
 
 
1787
    def get_file_size(self, file_id):
 
1788
        """See Tree.get_file_size"""
 
1789
        if self.kind(file_id) == 'file':
 
1790
            return self._transform._tree.get_file_size(file_id)
 
1791
        else:
 
1792
            return None
 
1793
 
 
1794
    def get_file_sha1(self, file_id, path=None, stat_value=None):
 
1795
        trans_id = self._transform.trans_id_file_id(file_id)
 
1796
        kind = self._transform._new_contents.get(trans_id)
 
1797
        if kind is None:
 
1798
            return self._transform._tree.get_file_sha1(file_id)
 
1799
        if kind == 'file':
 
1800
            fileobj = self.get_file(file_id)
 
1801
            try:
 
1802
                return sha_file(fileobj)
 
1803
            finally:
 
1804
                fileobj.close()
 
1805
 
 
1806
    def is_executable(self, file_id, path=None):
 
1807
        if file_id is None:
 
1808
            return False
 
1809
        trans_id = self._transform.trans_id_file_id(file_id)
 
1810
        try:
 
1811
            return self._transform._new_executability[trans_id]
 
1812
        except KeyError:
 
1813
            try:
 
1814
                return self._transform._tree.is_executable(file_id, path)
 
1815
            except OSError, e:
 
1816
                if e.errno == errno.ENOENT:
 
1817
                    return False
 
1818
                raise
 
1819
            except errors.NoSuchId:
 
1820
                return False
 
1821
 
 
1822
    def path_content_summary(self, path):
 
1823
        trans_id = self._path2trans_id(path)
 
1824
        tt = self._transform
 
1825
        tree_path = tt._tree_id_paths.get(trans_id)
 
1826
        kind = tt._new_contents.get(trans_id)
 
1827
        if kind is None:
 
1828
            if tree_path is None or trans_id in tt._removed_contents:
 
1829
                return 'missing', None, None, None
 
1830
            summary = tt._tree.path_content_summary(tree_path)
 
1831
            kind, size, executable, link_or_sha1 = summary
 
1832
        else:
 
1833
            link_or_sha1 = None
 
1834
            limbo_name = tt._limbo_name(trans_id)
 
1835
            if trans_id in tt._new_reference_revision:
 
1836
                kind = 'tree-reference'
 
1837
            if kind == 'file':
 
1838
                statval = os.lstat(limbo_name)
 
1839
                size = statval.st_size
 
1840
                if not supports_executable():
 
1841
                    executable = None
 
1842
                else:
 
1843
                    executable = statval.st_mode & S_IEXEC
 
1844
            else:
 
1845
                size = None
 
1846
                executable = None
 
1847
            if kind == 'symlink':
 
1848
                link_or_sha1 = os.readlink(limbo_name)
 
1849
        if supports_executable():
 
1850
            executable = tt._new_executability.get(trans_id, executable)
 
1851
        return kind, size, executable, link_or_sha1
 
1852
 
 
1853
    def iter_changes(self, from_tree, include_unchanged=False,
 
1854
                      specific_files=None, pb=None, extra_trees=None,
 
1855
                      require_versioned=True, want_unversioned=False):
 
1856
        """See InterTree.iter_changes.
 
1857
 
 
1858
        This has a fast path that is only used when the from_tree matches
 
1859
        the transform tree, and no fancy options are supplied.
 
1860
        """
 
1861
        if (from_tree is not self._transform._tree or include_unchanged or
 
1862
            specific_files or want_unversioned):
 
1863
            return tree.InterTree(from_tree, self).iter_changes(
 
1864
                include_unchanged=include_unchanged,
 
1865
                specific_files=specific_files,
 
1866
                pb=pb,
 
1867
                extra_trees=extra_trees,
 
1868
                require_versioned=require_versioned,
 
1869
                want_unversioned=want_unversioned)
 
1870
        if want_unversioned:
 
1871
            raise ValueError('want_unversioned is not supported')
 
1872
        return self._transform.iter_changes()
 
1873
 
 
1874
    def get_file(self, file_id, path=None):
 
1875
        """See Tree.get_file"""
 
1876
        if not self._content_change(file_id):
 
1877
            return self._transform._tree.get_file(file_id, path)
 
1878
        trans_id = self._transform.trans_id_file_id(file_id)
 
1879
        name = self._transform._limbo_name(trans_id)
 
1880
        return open(name, 'rb')
 
1881
 
 
1882
    def annotate_iter(self, file_id,
 
1883
                      default_revision=_mod_revision.CURRENT_REVISION):
 
1884
        changes = self._changes(file_id)
 
1885
        if changes is None:
 
1886
            get_old = True
 
1887
        else:
 
1888
            changed_content, versioned, kind = (changes[2], changes[3],
 
1889
                                                changes[6])
 
1890
            if kind[1] is None:
 
1891
                return None
 
1892
            get_old = (kind[0] == 'file' and versioned[0])
 
1893
        if get_old:
 
1894
            old_annotation = self._transform._tree.annotate_iter(file_id,
 
1895
                default_revision=default_revision)
 
1896
        else:
 
1897
            old_annotation = []
 
1898
        if changes is None:
 
1899
            return old_annotation
 
1900
        if not changed_content:
 
1901
            return old_annotation
 
1902
        return annotate.reannotate([old_annotation],
 
1903
                                   self.get_file(file_id).readlines(),
 
1904
                                   default_revision)
 
1905
 
 
1906
    def get_symlink_target(self, file_id):
 
1907
        """See Tree.get_symlink_target"""
 
1908
        if not self._content_change(file_id):
 
1909
            return self._transform._tree.get_symlink_target(file_id)
 
1910
        trans_id = self._transform.trans_id_file_id(file_id)
 
1911
        name = self._transform._limbo_name(trans_id)
 
1912
        return os.readlink(name)
 
1913
 
 
1914
    def walkdirs(self, prefix=''):
 
1915
        pending = [self._transform.root]
 
1916
        while len(pending) > 0:
 
1917
            parent_id = pending.pop()
 
1918
            children = []
 
1919
            subdirs = []
 
1920
            prefix = prefix.rstrip('/')
 
1921
            parent_path = self._final_paths.get_path(parent_id)
 
1922
            parent_file_id = self._transform.final_file_id(parent_id)
 
1923
            for child_id in self._all_children(parent_id):
 
1924
                path_from_root = self._final_paths.get_path(child_id)
 
1925
                basename = self._transform.final_name(child_id)
 
1926
                file_id = self._transform.final_file_id(child_id)
 
1927
                try:
 
1928
                    kind = self._transform.final_kind(child_id)
 
1929
                    versioned_kind = kind
 
1930
                except NoSuchFile:
 
1931
                    kind = 'unknown'
 
1932
                    versioned_kind = self._transform._tree.stored_kind(file_id)
 
1933
                if versioned_kind == 'directory':
 
1934
                    subdirs.append(child_id)
 
1935
                children.append((path_from_root, basename, kind, None,
 
1936
                                 file_id, versioned_kind))
 
1937
            children.sort()
 
1938
            if parent_path.startswith(prefix):
 
1939
                yield (parent_path, parent_file_id), children
 
1940
            pending.extend(sorted(subdirs, key=self._final_paths.get_path,
 
1941
                                  reverse=True))
 
1942
 
 
1943
    def get_parent_ids(self):
 
1944
        return self._parent_ids
 
1945
 
 
1946
    def set_parent_ids(self, parent_ids):
 
1947
        self._parent_ids = parent_ids
 
1948
 
 
1949
    def get_revision_tree(self, revision_id):
 
1950
        return self._transform._tree.get_revision_tree(revision_id)
 
1951
 
 
1952
 
 
1953
def joinpath(parent, child):
    """Join two tree-relative paths.

    The tree root, given as either None or the empty string, contributes
    nothing to the result: child is returned as it is.
    """
    at_root = parent is None or parent == ""
    if not at_root:
        return pathjoin(parent, child)
    return child
 
1959
 
 
1960
 
 
1961
class FinalPaths(object):
    """Calculate the final paths of trans_ids, remembering each result.

    Paths are cached, so the transform must not be changed between calls;
    otherwise stale paths will be returned.
    """
    def __init__(self, transform):
        object.__init__(self)
        self._known_paths = {}
        self.transform = transform

    def _determine_path(self, trans_id):
        """Work out the final path of trans_id without caching it."""
        tt = self.transform
        if trans_id == tt.root:
            return ""
        name = tt.final_name(trans_id)
        parent_id = tt.final_parent(trans_id)
        if parent_id != tt.root:
            # Parent paths go through the cache.
            return pathjoin(self.get_path(parent_id), name)
        return name

    def get_path(self, trans_id):
        """Find the final path associated with a trans_id"""
        try:
            return self._known_paths[trans_id]
        except KeyError:
            path = self._determine_path(trans_id)
            self._known_paths[trans_id] = path
            return path

    def get_paths(self, trans_ids):
        """Return a list of (final path, trans_id), in trans_ids order."""
        pairs = []
        for trans_id in trans_ids:
            pairs.append((self.get_path(trans_id), trans_id))
        return pairs
 
1990
 
 
1991
 
 
1992
 
 
1993
def topology_sorted_ids(tree):
    """Return the tree's file ids as a list sorted by path.

    Iterating tree supplies the ids; tree.id2path supplies the sort key.
    """
    return sorted(tree, key=tree.id2path)
 
1998
 
 
1999
 
 
2000
def build_tree(tree, wt, accelerator_tree=None, hardlink=False,
               delta_from_tree=False):
    """Create working tree for a branch, using a TreeTransform.

    This function should be used on empty trees, having a tree root at most.
    (see merge and revert functionality for working with existing trees)

    Existing files are handled like so:

    - Existing bzrdirs take precedence over creating new items.  They are
      created as '%s.diverted' % name.
    - Otherwise, if the content on disk matches the content we are building,
      it is silently replaced.
    - Otherwise, conflict resolution will move the old file to 'oldname.moved'.

    wt is write-locked, and tree and accelerator_tree (if given) are
    read-locked, for the duration of the build.  The locks are released in
    the reverse order, whether or not the build succeeds.

    :param tree: The tree to convert wt into a copy of
    :param wt: The working tree that files will be placed into
    :param accelerator_tree: A tree which can be used for retrieving file
        contents more quickly than tree itself, i.e. a workingtree.  tree
        will be used for cases where accelerator_tree's content is different.
    :param hardlink: If true, hard-link files to accelerator_tree, where
        possible.  accelerator_tree must implement abspath, i.e. be a
        working tree.
    :param delta_from_tree: If true, build_tree may use the input Tree to
        generate the inventory delta.
    :return: Whatever _build_tree returns.
    """
    have_accelerator = accelerator_tree is not None
    wt.lock_tree_write()
    try:
        tree.lock_read()
        try:
            if have_accelerator:
                accelerator_tree.lock_read()
            try:
                return _build_tree(tree, wt, accelerator_tree, hardlink,
                                   delta_from_tree)
            finally:
                if have_accelerator:
                    accelerator_tree.unlock()
        finally:
            tree.unlock()
    finally:
        wt.unlock()
 
2042
 
 
2043
 
 
2044
def _build_tree(tree, wt, accelerator_tree, hardlink, delta_from_tree):
    """See build_tree.

    build_tree takes the locks on wt, tree and accelerator_tree before
    calling this function; no locking is done here.

    :param tree: The tree whose inventory is replicated into wt
    :param wt: The working tree that files will be placed into
    :param accelerator_tree: Optional tree handed to _create_files as a
        faster source of file contents (may be None)
    :param hardlink: Passed through to _create_files
    :param delta_from_tree: If true, collect a precomputed inventory delta
        while walking tree and hand it to tt.apply
    :raises errors.WorkingTreeAlreadyPopulated: if wt reports more than one
        file id (i.e. more than just a root)
    :return: whatever tt.apply returns
    """
    for num, _unused in enumerate(wt.all_file_ids()):
        if num > 0:  # more than just a root
            raise errors.WorkingTreeAlreadyPopulated(base=wt.basedir)
    existing_files = set()
    for dir_info, files in wt.walkdirs():
        existing_files.update(f[0] for f in files)
    file_trans_id = {}
    top_pb = bzrlib.ui.ui_factory.nested_progress_bar()
    # tt stays None until the transform exists, so the finally clause can
    # always finish top_pb, even when setup fails before the transform is
    # created.
    tt = None
    try:
        pp = ProgressPhase("Build phase", 2, top_pb)
        if tree.inventory.root is not None:
            # This is kind of a hack: we should be altering the root
            # as part of the regular tree shape diff logic.
            # The conditional test here is to avoid doing an
            # expensive operation (flush) every time the root id
            # is set within the tree, nor setting the root and thus
            # marking the tree as dirty, because we use two different
            # idioms here: tree interfaces and inventory interfaces.
            if wt.get_root_id() != tree.get_root_id():
                wt.set_root_id(tree.get_root_id())
                wt.flush()
        tt = TreeTransform(wt)
        # file ids whose existing on-disk directory is itself a bzrdir
        divert = set()
        pp.next_phase()
        file_trans_id[wt.get_root_id()] = \
            tt.trans_id_tree_file_id(wt.get_root_id())
        pb = bzrlib.ui.ui_factory.nested_progress_bar()
        try:
            deferred_contents = []
            num = 0
            total = len(tree.inventory)
            if delta_from_tree:
                precomputed_delta = []
            else:
                precomputed_delta = None
            for num, (tree_path, entry) in \
                enumerate(tree.inventory.iter_entries_by_dir()):
                pb.update("Building tree", num - len(deferred_contents), total)
                if entry.parent_id is None:
                    # the root was handled above
                    continue
                reparent = False
                file_id = entry.file_id
                if delta_from_tree:
                    precomputed_delta.append((None, tree_path, file_id, entry))
                if tree_path in existing_files:
                    target_path = wt.abspath(tree_path)
                    kind = file_kind(target_path)
                    if kind == "directory":
                        try:
                            bzrdir.BzrDir.open(target_path)
                        except errors.NotBranchError:
                            pass
                        else:
                            divert.add(file_id)
                    if (file_id not in divert and
                        _content_match(tree, entry, file_id, kind,
                        target_path)):
                        # The existing item already matches: drop it so the
                        # new entry takes its place without a conflict.
                        tt.delete_contents(tt.trans_id_tree_path(tree_path))
                        if kind == 'directory':
                            reparent = True
                parent_id = file_trans_id[entry.parent_id]
                if entry.kind == 'file':
                    # We *almost* replicate new_by_entry, so that we can defer
                    # getting the file text, and get them all at once.
                    trans_id = tt.create_path(entry.name, parent_id)
                    file_trans_id[file_id] = trans_id
                    tt.version_file(file_id, trans_id)
                    executable = tree.is_executable(file_id, tree_path)
                    if executable:
                        tt.set_executability(executable, trans_id)
                    deferred_contents.append((file_id, trans_id))
                else:
                    file_trans_id[file_id] = new_by_entry(tt, entry, parent_id,
                                                          tree)
                if reparent:
                    # keep the children of the replaced on-disk directory
                    new_trans_id = file_trans_id[file_id]
                    old_parent = tt.trans_id_tree_path(tree_path)
                    _reparent_children(tt, old_parent, new_trans_id)
            offset = num + 1 - len(deferred_contents)
            _create_files(tt, tree, deferred_contents, pb, offset,
                          accelerator_tree, hardlink)
        finally:
            pb.finished()
        pp.next_phase()
        divert_trans = set(file_trans_id[f] for f in divert)
        resolver = lambda t, c: resolve_checkout(t, c, divert_trans)
        raw_conflicts = resolve_conflicts(tt, pass_func=resolver)
        if len(raw_conflicts) > 0:
            # conflict resolution changed the transform, so the delta
            # collected during the walk is not passed on
            precomputed_delta = None
        conflicts = cook_conflicts(raw_conflicts, tt)
        for conflict in conflicts:
            warning(conflict)
        try:
            wt.add_conflicts(conflicts)
        except errors.UnsupportedOperation:
            pass
        result = tt.apply(no_conflicts=True,
                          precomputed_delta=precomputed_delta)
    finally:
        if tt is not None:
            tt.finalize()
        top_pb.finished()
    return result
 
2148
 
 
2149
 
 
2150
def _create_files(tt, tree, desired_files, pb, offset, accelerator_tree,
 
2151
                  hardlink):
 
2152
    total = len(desired_files) + offset
 
2153
    if accelerator_tree is None:
 
2154
        new_desired_files = desired_files
 
2155
    else:
 
2156
        iter = accelerator_tree.iter_changes(tree, include_unchanged=True)
 
2157
        unchanged = dict((f, p[1]) for (f, p, c, v, d, n, k, e)
 
2158
                         in iter if not (c or e[0] != e[1]))
 
2159
        new_desired_files = []
 
2160
        count = 0
 
2161
        for file_id, trans_id in desired_files:
 
2162
            accelerator_path = unchanged.get(file_id)
 
2163
            if accelerator_path is None:
 
2164
                new_desired_files.append((file_id, trans_id))
 
2165
                continue
 
2166
            pb.update('Adding file contents', count + offset, total)
 
2167
            if hardlink:
 
2168
                tt.create_hardlink(accelerator_tree.abspath(accelerator_path),
 
2169
                                   trans_id)
 
2170
            else:
 
2171
                contents = accelerator_tree.get_file(file_id, accelerator_path)
 
2172
                try:
 
2173
                    tt.create_file(contents, trans_id)
 
2174
                finally:
 
2175
                    contents.close()
 
2176
            count += 1
 
2177
        offset += count
 
2178
    for count, (trans_id, contents) in enumerate(tree.iter_files_bytes(
 
2179
                                                 new_desired_files)):
 
2180
        tt.create_file(contents, trans_id)
 
2181
        pb.update('Adding file contents', count + offset, total)
 
2182
 
 
2183
 
 
2184
def _reparent_children(tt, old_parent, new_parent):
 
2185
    for child in tt.iter_tree_children(old_parent):
 
2186
        tt.adjust_path(tt.final_name(child), new_parent, child)
 
2187
 
 
2188
def _reparent_transform_children(tt, old_parent, new_parent):
 
2189
    by_parent = tt.by_parent()
 
2190
    for child in by_parent[old_parent]:
 
2191
        tt.adjust_path(tt.final_name(child), new_parent, child)
 
2192
    return by_parent[old_parent]
 
2193
 
 
2194
def _content_match(tree, entry, file_id, kind, target_path):
 
2195
    if entry.kind != kind:
 
2196
        return False
 
2197
    if entry.kind == "directory":
 
2198
        return True
 
2199
    if entry.kind == "file":
 
2200
        if tree.get_file(file_id).read() == file(target_path, 'rb').read():
 
2201
            return True
 
2202
    elif entry.kind == "symlink":
 
2203
        if tree.get_symlink_target(file_id) == os.readlink(target_path):
 
2204
            return True
 
2205
    return False
 
2206
 
 
2207
 
 
2208
def resolve_checkout(tt, conflicts, divert):
    """Resolve 'duplicate' conflicts by renaming one of the two files.

    :param tt: The transform to resolve conflicts in
    :param conflicts: Raw conflict tuples; each must be of type 'duplicate'
    :param divert: trans_ids of new files that get a '.diverted' name
        instead of displacing the existing file to '.moved'
    :raises AssertionError: for any conflict type other than 'duplicate'
    :return: a set of raw conflicts describing the renames performed
    """
    new_conflicts = set()
    for conflict in conflicts:
        c_type = conflict[0]
        # Anything but a 'duplicate' would indicate programmer error
        if c_type != 'duplicate':
            raise AssertionError(c_type)
        # The side with new contents in the transform is the new file
        if tt.new_contents(conflict[1]):
            new_file, old_file = conflict[1], conflict[2]
        else:
            new_file, old_file = conflict[2], conflict[1]

        # We should only get here if the conflict wasn't completely
        # resolved
        final_parent = tt.final_parent(old_file)
        if new_file in divert:
            suffix, action = '.diverted', 'Diverted to'
            renamed, other = new_file, old_file
        else:
            suffix, action = '.moved', 'Moved existing file to'
            renamed, other = old_file, new_file
        tt.adjust_path(tt.final_name(old_file) + suffix, final_parent,
                       renamed)
        new_conflicts.add((c_type, action, renamed, other))
    return new_conflicts
 
2236
 
 
2237
 
 
2238
def new_by_entry(tt, entry, parent_id, tree):
    """Create a new file according to its inventory entry

    :param tt: The transform to create the item in
    :param entry: The inventory entry describing the item
    :param parent_id: trans_id of the parent directory
    :param tree: The tree supplying file text, executability and symlink
        targets
    :raises errors.BadFileKindError: if the entry's kind is not one of
        file, directory, tree-reference or symlink
    :return: the trans_id of the newly created item
    """
    name = entry.name
    kind = entry.kind
    if kind == 'file':
        # Close the tree file once its lines are read, the same way
        # create_from_tree does.
        tree_file = tree.get_file(entry.file_id)
        try:
            contents = tree_file.readlines()
        finally:
            tree_file.close()
        executable = tree.is_executable(entry.file_id)
        return tt.new_file(name, parent_id, contents, entry.file_id,
                           executable)
    elif kind in ('directory', 'tree-reference'):
        trans_id = tt.new_directory(name, parent_id, entry.file_id)
        if kind == 'tree-reference':
            tt.set_tree_reference(entry.reference_revision, trans_id)
        return trans_id
    elif kind == 'symlink':
        target = tree.get_symlink_target(entry.file_id)
        return tt.new_symlink(name, parent_id, target, entry.file_id)
    else:
        raise errors.BadFileKindError(name, kind)
 
2257
 
 
2258
 
 
2259
@deprecated_function(deprecated_in((1, 9, 0)))
def create_by_entry(tt, entry, tree, trans_id, lines=None, mode_id=None):
    """Create new file contents according to an inventory entry.

    DEPRECATED.  Use create_from_tree instead.

    :param tt: The transform to create contents in
    :param entry: The inventory entry; only file, symlink and directory
        kinds create anything, other kinds are ignored
    :param tree: The tree supplying file text and symlink targets
    :param trans_id: The trans_id to create contents for
    :param lines: Optional file text; read from tree when None
    :param mode_id: Passed to tt.create_file for file entries
    """
    if entry.kind == "file":
        if lines is None:
            # Close the tree file once its lines are read, the same way
            # create_from_tree does.
            tree_file = tree.get_file(entry.file_id)
            try:
                lines = tree_file.readlines()
            finally:
                tree_file.close()
        tt.create_file(lines, trans_id, mode_id=mode_id)
    elif entry.kind == "symlink":
        tt.create_symlink(tree.get_symlink_target(entry.file_id), trans_id)
    elif entry.kind == "directory":
        tt.create_directory(trans_id)
 
2273
 
 
2274
 
 
2275
def create_from_tree(tt, trans_id, tree, file_id, bytes=None):
    """Create new file contents according to tree contents.

    :param tt: The transform to create contents in
    :param trans_id: The trans_id to create contents for
    :param tree: The tree supplying the kind, text and symlink target
    :param file_id: The file id to look up in tree
    :param bytes: Optional file text; read from tree when None
    :raises AssertionError: if tree reports a kind other than directory,
        file or symlink
    """
    kind = tree.kind(file_id)
    if kind == 'directory':
        tt.create_directory(trans_id)
        return
    if kind == "symlink":
        tt.create_symlink(tree.get_symlink_target(file_id), trans_id)
        return
    if kind != "file":
        raise AssertionError('Unknown kind %r' % kind)
    if bytes is None:
        source = tree.get_file(file_id)
        try:
            bytes = source.readlines()
        finally:
            source.close()
    tt.create_file(bytes, trans_id)
 
2292
 
 
2293
 
 
2294
def create_entry_executability(tt, entry, trans_id):
    """Set the executability of a trans_id according to an inventory entry

    Entries whose kind is not "file" are left untouched.
    """
    if entry.kind != "file":
        return
    tt.set_executability(entry.executable, trans_id)
 
2298
 
 
2299
 
 
2300
def get_backup_name(entry, by_parent, parent_trans_id, tt):
    """Produce a backup-style name for entry via _get_backup_name."""
    entry_name = entry.name
    return _get_backup_name(entry_name, by_parent, parent_trans_id, tt)
 
2302
 
 
2303
 
 
2304
def _get_backup_name(name, by_parent, parent_trans_id, tt):
 
2305
    """Produce a backup-style name that appears to be available"""
 
2306
    def name_gen():
 
2307
        counter = 1
 
2308
        while True:
 
2309
            yield "%s.~%d~" % (name, counter)
 
2310
            counter += 1
 
2311
    for new_name in name_gen():
 
2312
        if not tt.has_named_child(by_parent, parent_trans_id, new_name):
 
2313
            return new_name
 
2314
 
 
2315
 
 
2316
def _entry_changes(file_id, entry, working_tree):
 
2317
    """Determine in which ways the inventory entry has changed.
 
2318
 
 
2319
    Returns booleans: has_contents, content_mod, meta_mod
 
2320
    has_contents means there are currently contents, but they differ
 
2321
    contents_mod means contents need to be modified
 
2322
    meta_mod means the metadata needs to be modified
 
2323
    """
 
2324
    cur_entry = working_tree.inventory[file_id]
 
2325
    try:
 
2326
        working_kind = working_tree.kind(file_id)
 
2327
        has_contents = True
 
2328
    except NoSuchFile:
 
2329
        has_contents = False
 
2330
        contents_mod = True
 
2331
        meta_mod = False
 
2332
    if has_contents is True:
 
2333
        if entry.kind != working_kind:
 
2334
            contents_mod, meta_mod = True, False
 
2335
        else:
 
2336
            cur_entry._read_tree_state(working_tree.id2path(file_id), 
 
2337
                                       working_tree)
 
2338
            contents_mod, meta_mod = entry.detect_changes(cur_entry)
 
2339
            cur_entry._forget_tree_state()
 
2340
    return has_contents, contents_mod, meta_mod
 
2341
 
 
2342
 
 
2343
def revert(working_tree, target_tree, filenames, backups=False,
           pb=DummyProgress(), change_reporter=None):
    """Revert a working tree's contents to those of a target tree.

    :param working_tree: The tree to modify
    :param target_tree: The tree supplying the desired state; read-locked
        for the duration of the call
    :param filenames: Passed to _prepare_revert_transform to select what
        is reverted
    :param backups: Passed to _prepare_revert_transform
    :param pb: Progress bar used by the transform and the revert phases
    :param change_reporter: If true, changes are reported.
        NOTE(review): the object passed in is only tested for truth; a new
        delta._ChangeReporter is created for the actual reporting.
    :return: the cooked conflicts from _prepare_revert_transform
    """
    target_tree.lock_read()
    try:
        # Build the transform inside the lock's try block so a failing
        # constructor cannot leave target_tree locked.
        tt = TreeTransform(working_tree, pb)
        try:
            pp = ProgressPhase("Revert phase", 3, pb)
            conflicts, merge_modified = _prepare_revert_transform(
                working_tree, target_tree, tt, filenames, backups, pp)
            if change_reporter:
                change_reporter = delta._ChangeReporter(
                    unversioned_filter=working_tree.is_ignored)
                delta.report_changes(tt.iter_changes(), change_reporter)
            for conflict in conflicts:
                warning(conflict)
            pp.next_phase()
            tt.apply()
            working_tree.set_merge_modified(merge_modified)
        finally:
            # finalize in its own finally so a failing unlock below cannot
            # skip it
            tt.finalize()
    finally:
        target_tree.unlock()
        pb.clear()
    return conflicts
 
2366
 
 
2367
 
 
2368
def _prepare_revert_transform(working_tree, target_tree, tt, filenames,
                              backups, pp, basis_tree=None,
                              merge_modified=None):
    """Fill tt with the changes for a revert and resolve its conflicts.

    Advances pp twice: once before altering files and once before
    resolving conflicts.

    :param merge_modified: Optional merge-modified mapping; fetched from
        working_tree when None
    :return: (cooked conflicts, updated merge_modified)
    """
    pp.next_phase()
    alter_pb = bzrlib.ui.ui_factory.nested_progress_bar()
    try:
        if merge_modified is None:
            merge_modified = working_tree.merge_modified()
        merge_modified = _alter_files(working_tree, target_tree, tt,
                                      alter_pb, filenames, backups,
                                      merge_modified, basis_tree)
    finally:
        alter_pb.finished()

    def resolve_against_target(transform, found):
        # conflict_pass looks up supplemental paths in target_tree
        return conflict_pass(transform, found, target_tree)

    pp.next_phase()
    resolve_pb = bzrlib.ui.ui_factory.nested_progress_bar()
    try:
        raw_conflicts = resolve_conflicts(tt, resolve_pb,
                                          resolve_against_target)
    finally:
        resolve_pb.finished()
    return cook_conflicts(raw_conflicts, tt), merge_modified
 
2390
 
 
2391
 
 
2392
def _alter_files(working_tree, target_tree, tt, pb, specific_files,
 
2393
                 backups, merge_modified, basis_tree=None):
 
2394
    if basis_tree is not None:
 
2395
        basis_tree.lock_read()
 
2396
    change_list = target_tree.iter_changes(working_tree,
 
2397
        specific_files=specific_files, pb=pb)
 
2398
    if target_tree.get_root_id() is None:
 
2399
        skip_root = True
 
2400
    else:
 
2401
        skip_root = False
 
2402
    try:
 
2403
        deferred_files = []
 
2404
        for id_num, (file_id, path, changed_content, versioned, parent, name,
 
2405
                kind, executable) in enumerate(change_list):
 
2406
            if skip_root and file_id[0] is not None and parent[0] is None:
 
2407
                continue
 
2408
            trans_id = tt.trans_id_file_id(file_id)
 
2409
            mode_id = None
 
2410
            if changed_content:
 
2411
                keep_content = False
 
2412
                if kind[0] == 'file' and (backups or kind[1] is None):
 
2413
                    wt_sha1 = working_tree.get_file_sha1(file_id)
 
2414
                    if merge_modified.get(file_id) != wt_sha1:
 
2415
                        # acquire the basis tree lazily to prevent the
 
2416
                        # expense of accessing it when it's not needed ?
 
2417
                        # (Guessing, RBC, 200702)
 
2418
                        if basis_tree is None:
 
2419
                            basis_tree = working_tree.basis_tree()
 
2420
                            basis_tree.lock_read()
 
2421
                        if file_id in basis_tree:
 
2422
                            if wt_sha1 != basis_tree.get_file_sha1(file_id):
 
2423
                                keep_content = True
 
2424
                        elif kind[1] is None and not versioned[1]:
 
2425
                            keep_content = True
 
2426
                if kind[0] is not None:
 
2427
                    if not keep_content:
 
2428
                        tt.delete_contents(trans_id)
 
2429
                    elif kind[1] is not None:
 
2430
                        parent_trans_id = tt.trans_id_file_id(parent[0])
 
2431
                        by_parent = tt.by_parent()
 
2432
                        backup_name = _get_backup_name(name[0], by_parent,
 
2433
                                                       parent_trans_id, tt)
 
2434
                        tt.adjust_path(backup_name, parent_trans_id, trans_id)
 
2435
                        new_trans_id = tt.create_path(name[0], parent_trans_id)
 
2436
                        if versioned == (True, True):
 
2437
                            tt.unversion_file(trans_id)
 
2438
                            tt.version_file(file_id, new_trans_id)
 
2439
                        # New contents should have the same unix perms as old
 
2440
                        # contents
 
2441
                        mode_id = trans_id
 
2442
                        trans_id = new_trans_id
 
2443
                if kind[1] in ('directory', 'tree-reference'):
 
2444
                    tt.create_directory(trans_id)
 
2445
                    if kind[1] == 'tree-reference':
 
2446
                        revision = target_tree.get_reference_revision(file_id,
 
2447
                                                                      path[1])
 
2448
                        tt.set_tree_reference(revision, trans_id)
 
2449
                elif kind[1] == 'symlink':
 
2450
                    tt.create_symlink(target_tree.get_symlink_target(file_id),
 
2451
                                      trans_id)
 
2452
                elif kind[1] == 'file':
 
2453
                    deferred_files.append((file_id, (trans_id, mode_id)))
 
2454
                    if basis_tree is None:
 
2455
                        basis_tree = working_tree.basis_tree()
 
2456
                        basis_tree.lock_read()
 
2457
                    new_sha1 = target_tree.get_file_sha1(file_id)
 
2458
                    if (file_id in basis_tree and new_sha1 ==
 
2459
                        basis_tree.get_file_sha1(file_id)):
 
2460
                        if file_id in merge_modified:
 
2461
                            del merge_modified[file_id]
 
2462
                    else:
 
2463
                        merge_modified[file_id] = new_sha1
 
2464
 
 
2465
                    # preserve the execute bit when backing up
 
2466
                    if keep_content and executable[0] == executable[1]:
 
2467
                        tt.set_executability(executable[1], trans_id)
 
2468
                elif kind[1] is not None:
 
2469
                    raise AssertionError(kind[1])
 
2470
            if versioned == (False, True):
 
2471
                tt.version_file(file_id, trans_id)
 
2472
            if versioned == (True, False):
 
2473
                tt.unversion_file(trans_id)
 
2474
            if (name[1] is not None and
 
2475
                (name[0] != name[1] or parent[0] != parent[1])):
 
2476
                if name[1] == '' and parent[1] is None:
 
2477
                    parent_trans = ROOT_PARENT
 
2478
                else:
 
2479
                    parent_trans = tt.trans_id_file_id(parent[1])
 
2480
                tt.adjust_path(name[1], parent_trans, trans_id)
 
2481
            if executable[0] != executable[1] and kind[1] == "file":
 
2482
                tt.set_executability(executable[1], trans_id)
 
2483
        for (trans_id, mode_id), bytes in target_tree.iter_files_bytes(
 
2484
            deferred_files):
 
2485
            tt.create_file(bytes, trans_id, mode_id)
 
2486
    finally:
 
2487
        if basis_tree is not None:
 
2488
            basis_tree.unlock()
 
2489
    return merge_modified
 
2490
 
 
2491
 
 
2492
def resolve_conflicts(tt, pb=DummyProgress(), pass_func=None):
    """Make many conflict-resolution attempts, but die if they fail

    :param tt: The transform to resolve conflicts in
    :param pb: Progress bar updated once per pass and cleared on exit
    :param pass_func: Callable (tt, conflicts) returning the raw conflicts
        it dealt with; defaults to conflict_pass
    :raises MalformedTransform: if conflicts remain after 10 passes
    :return: the set of raw conflicts accumulated from all passes
    """
    if pass_func is None:
        pass_func = conflict_pass
    max_passes = 10
    resolved = set()
    try:
        for attempt in range(1, max_passes + 1):
            pb.update('Resolution pass', attempt, 10)
            conflicts = tt.find_conflicts()
            if len(conflicts) == 0:
                return resolved
            resolved.update(pass_func(tt, conflicts))
        raise MalformedTransform(conflicts=conflicts)
    finally:
        pb.clear()
 
2507
 
 
2508
 
 
2509
def conflict_pass(tt, conflicts, path_tree=None):
    """Resolve some classes of conflicts.

    Conflict types that are not recognised are left alone.

    :param tt: The transform to resolve conflicts in
    :param conflicts: The conflicts to resolve
    :param path_tree: A Tree to get supplemental paths from
    :return: a set of raw conflicts describing the actions taken
    """
    resolved = set()
    for conflict in conflicts:
        c_type = conflict[0]
        if c_type == 'duplicate id':
            tt.unversion_file(conflict[1])
            resolved.add((c_type, 'Unversioned existing file',
                          conflict[1], conflict[2], ))
        elif c_type == 'duplicate':
            # files that were renamed take precedence
            final_parent = tt.final_parent(conflict[1])
            if tt.path_changed(conflict[1]):
                existing_file = conflict[2]
                new_file = conflict[1]
            else:
                existing_file = conflict[1]
                new_file = conflict[2]
            moved_name = tt.final_name(existing_file) + '.moved'
            tt.adjust_path(moved_name, final_parent, existing_file)
            resolved.add((c_type, 'Moved existing file to',
                          existing_file, new_file))
        elif c_type == 'parent loop':
            # break the loop by undoing one of the ops that caused the loop
            culprit = conflict[1]
            while not tt.path_changed(culprit):
                culprit = tt.final_parent(culprit)
            resolved.add((c_type, 'Cancelled move', culprit,
                          tt.final_parent(culprit),))
            tt.adjust_path(tt.final_name(culprit),
                           tt.get_tree_parent(culprit), culprit)
        elif c_type == 'missing parent':
            trans_id = conflict[1]
            try:
                tt.cancel_deletion(trans_id)
            except KeyError:
                # the parent was not deleted by this transform
                create = True
                try:
                    tt.final_name(trans_id)
                except NoFinalPath:
                    if path_tree is not None:
                        file_id = tt.final_file_id(trans_id)
                        if file_id is None:
                            file_id = tt.inactive_file_id(trans_id)
                        entry = path_tree.inventory[file_id]
                        # special-case the other tree root (move its
                        # children to current root)
                        if entry.parent_id is None:
                            create = False
                            moved = _reparent_transform_children(
                                tt, trans_id, tt.root)
                            for child in moved:
                                resolved.add((c_type, 'Moved to root',
                                              child))
                        else:
                            parent_trans_id = tt.trans_id_file_id(
                                entry.parent_id)
                            tt.adjust_path(entry.name, parent_trans_id,
                                           trans_id)
                if create:
                    tt.create_directory(trans_id)
                    resolved.add((c_type, 'Created directory', trans_id))
            else:
                resolved.add(('deleting parent', 'Not deleting',
                              trans_id))
        elif c_type == 'unversioned parent':
            file_id = tt.inactive_file_id(conflict[1])
            # special-case the other tree root (move its children instead)
            if (path_tree and file_id in path_tree and
                path_tree.inventory[file_id].parent_id is None):
                continue
            tt.version_file(file_id, conflict[1])
            resolved.add((c_type, 'Versioned directory', conflict[1]))
        elif c_type == 'non-directory parent':
            parent_id = conflict[1]
            parent_parent = tt.final_parent(parent_id)
            parent_name = tt.final_name(parent_id)
            parent_file_id = tt.final_file_id(parent_id)
            new_parent_id = tt.new_directory(parent_name + '.new',
                parent_parent, parent_file_id)
            _reparent_transform_children(tt, parent_id, new_parent_id)
            if parent_file_id is not None:
                tt.unversion_file(parent_id)
            resolved.add((c_type, 'Created directory', new_parent_id))
        elif c_type == 'versioning no contents':
            tt.cancel_versioning(conflict[1])
    return resolved
 
2597
 
 
2598
 
 
2599
def cook_conflicts(raw_conflicts, tt):
    """Generate a list of cooked conflicts, sorted by file path

    :param raw_conflicts: Raw conflict tuples, as produced by the
        conflict-resolution passes
    :param tt: The transform the conflicts belong to
    :return: a list of the objects yielded by iter_cook_conflicts, ordered
        by Conflict.sort_key
    """
    from bzrlib.conflicts import Conflict
    cooked = list(iter_cook_conflicts(raw_conflicts, tt))
    cooked.sort(key=Conflict.sort_key)
    return cooked
 
2604
 
 
2605
 
 
2606
def iter_cook_conflicts(raw_conflicts, tt):
    """Yield a cooked Conflict for each raw conflict tuple.

    A raw conflict is (type, action, trans_id) or
    (type, action, trans_id, conflicting_trans_id); trans_ids are turned
    into final paths and file ids before being passed to Conflict.factory.
    """
    from bzrlib.conflicts import Conflict
    final_paths = FinalPaths(tt)
    for raw in raw_conflicts:
        c_type = raw[0]
        details = {'action': raw[1]}
        details['path'] = final_paths.get_path(raw[2])
        details['file_id'] = tt.final_file_id(raw[2])
        if len(raw) != 3:
            # a second trans_id names the item conflicted with
            details['conflict_path'] = final_paths.get_path(raw[3])
            details['conflict_file_id'] = tt.final_file_id(raw[3])
        yield Conflict.factory(c_type, **details)
 
2625
 
 
2626
 
 
2627
class _FileMover(object):
 
2628
    """Moves and deletes files for TreeTransform, tracking operations"""
 
2629
 
 
2630
    def __init__(self):
 
2631
        self.past_renames = []
 
2632
        self.pending_deletions = []
 
2633
 
 
2634
    def rename(self, from_, to):
 
2635
        """Rename a file from one path to another.  Functions like os.rename"""
 
2636
        try:
 
2637
            os.rename(from_, to)
 
2638
        except OSError, e:
 
2639
            if e.errno in (errno.EEXIST, errno.ENOTEMPTY):
 
2640
                raise errors.FileExists(to, str(e))
 
2641
            raise
 
2642
        self.past_renames.append((from_, to))
 
2643
 
 
2644
    def pre_delete(self, from_, to):
 
2645
        """Rename a file out of the way and mark it for deletion.
 
2646
 
 
2647
        Unlike os.unlink, this works equally well for files and directories.
 
2648
        :param from_: The current file path
 
2649
        :param to: A temporary path for the file
 
2650
        """
 
2651
        self.rename(from_, to)
 
2652
        self.pending_deletions.append(to)
 
2653
 
 
2654
    def rollback(self):
 
2655
        """Reverse all renames that have been performed"""
 
2656
        for from_, to in reversed(self.past_renames):
 
2657
            os.rename(to, from_)
 
2658
        # after rollback, don't reuse _FileMover
 
2659
        past_renames = None
 
2660
        pending_deletions = None
 
2661
 
 
2662
    def apply_deletions(self):
 
2663
        """Apply all marked deletions"""
 
2664
        for path in self.pending_deletions:
 
2665
            delete_any(path)
 
2666
        # after apply_deletions, don't reuse _FileMover
 
2667
        past_renames = None
 
2668
        pending_deletions = None