~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/inventory.py

Committer: mbp at sourcefrog
Date: 2005-04-04 13:57:54 UTC
Revision ID: mbp@sourcefrog.net-20050404135754-ae2e4e5fb0094c91

- Write .bzr.log in utf8

files added:
bzrlib/tests.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/faq.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quickref.txt

doc/quilt.txt

doc/random.txt

doc/requirements.txt

doc/revision-syntax.txt

doc/roadmap.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/supportability.txt

doc/svk.txt

doc/tagging.txt

doc/taxonomy.txt

doc/testing.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/work-order.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/new-inventory-sample.xml

notes/performance.txt

files removed:
.rsyncexclude

BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS.developers

TODO

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bzrdir.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revprops.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/README.1st

doc/configuration.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

generate_docs.py

profile_imports.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

files renamed:
contrib/newinventory.py => bzrlib/newinventory.py

bzrlib/store/__init__.py => bzrlib/store.py

bzrlib/xml_serializer.py => bzrlib/xml.py

bzrlib/util/elementtree/ => elementtree/

files modified:
.bzrignore

NEWS

README

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/osutils.py

bzrlib/revision.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

elementtree/ElementTree.py

setup.py *

Show diffs side-by-side

added added

removed removed

bzrlib/inventory.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# FIXME: This refactoring of the workingtree code doesn't seem to keep

# the WorkingTree's copy of the inventory in sync with the branch. The

# branch modifies its working inventory when it does a commit to make

# missing files permanently removed.

# TODO: Maybe also keep the full path of the entry, and the children?

# But those depend on its position within a particular inventory, and

# it would be nice not to need to hold the backpointer here.

# This should really be an id randomly assigned when the tree is

# created, but it's not for now.

ROOT_ID = "TREE_ROOT"

import collections

import os.path

import re

import sys

import tarfile

import types

"""Inventories map files to their name in a revision."""

# TODO: Maybe store inventory_id in the file? Not really needed.

__author__ = "Martin Pool <mbp@canonical.com>"

import sys, os.path, types, re

from sets import Set

try:

from cElementTree import Element, ElementTree, SubElement

except ImportError:

from elementtree.ElementTree import Element, ElementTree, SubElement

from xml import XMLMixin

from errors import bailout

import bzrlib

from bzrlib import errors, osutils

from bzrlib.osutils import (pumpfile, quotefn, splitpath, joinpath,

pathjoin, sha_strings)

from bzrlib.errors import (NotVersionedError, InvalidEntryName,

BzrError, BzrCheckError, BinaryFile)

from bzrlib.osutils import uuid, quotefn, splitpath, joinpath, appendpath

from bzrlib.trace import mutter

class InventoryEntry(object):

class InventoryEntry(XMLMixin):

"""Description of a versioned file.

An InventoryEntry has the following fields, which are also

present in the XML inventory-entry element:

file_id

name

(within the parent directory)

parent_id

file_id of the parent directory, or ROOT_ID

revision

the revision_id in which this variation of this file was

introduced.

executable

Indicates that this file should be executable on systems

that support it.

text_sha1

sha-1 of the text of the file

text_size

size in bytes of the text of the file

(reading a version 4 tree created a text_id field.)

* *file_id*

* *name*: (only the basename within the directory, must not

contain slashes)

* *kind*: "directory" or "file"

* *directory_id*: (if absent/null means the branch root directory)

* *text_sha1*: only for files

* *text_size*: in bytes, only for files

* *text_id*: identifier for the text version, only for files

InventoryEntries can also exist inside a WorkingTree

inventory, in which case they are not yet bound to a

particular revision of the file. In that case the text_sha1,

text_size and text_id are absent.

>>> i = Inventory()

>>> i.path2id('')

'TREE_ROOT'

>>> i.add(InventoryDirectory('123', 'src', ROOT_ID))

InventoryDirectory('123', 'src', parent_id='TREE_ROOT', revision=None)

>>> i.add(InventoryFile('2323', 'hello.c', parent_id='123'))

InventoryFile('2323', 'hello.c', parent_id='123', sha1=None, len=None)

>>> shouldbe = {0: '', 1: 'src', 2: pathjoin('src','hello.c')}

>>> for ix, j in enumerate(i.iter_entries()):

... print (j[0] == shouldbe[ix], j[1])

>>> i.add(InventoryEntry('123', 'src', kind='directory'))

>>> i.add(InventoryEntry('2323', 'hello.c', parent_id='123'))

>>> for j in i.iter_entries():

... print j

...

(True, RootEntry('TREE_ROOT', u'', parent_id=None, revision=None))

(True, InventoryDirectory('123', 'src', parent_id='TREE_ROOT', revision=None))

(True, InventoryFile('2323', 'hello.c', parent_id='123', sha1=None, len=None))

>>> i.add(InventoryFile('2323', 'bye.c', '123'))

('src', InventoryEntry('123', 'src', kind='directory', parent_id=None))

('src/hello.c', InventoryEntry('2323', 'hello.c', kind='file', parent_id='123'))

>>> i.add(InventoryEntry('2323', 'bye.c', parent_id='123'))

Traceback (most recent call last):

...

BzrError: inventory already contains entry with id {2323}

>>> i.add(InventoryFile('2324', 'bye.c', '123'))

InventoryFile('2324', 'bye.c', parent_id='123', sha1=None, len=None)

>>> i.add(InventoryDirectory('2325', 'wibble', '123'))

InventoryDirectory('2325', 'wibble', parent_id='123', revision=None)

BzrError: ('inventory already contains entry with id {2323}', [])

>>> i.add(InventoryEntry('2324', 'bye.c', parent_id='123'))

>>> i.add(InventoryEntry('2325', 'wibble', parent_id='123', kind='directory'))

>>> i.path2id('src/wibble')

100

'2325'

101

>>> '2325' in i

102

True

103

>>> i.add(InventoryFile('2326', 'wibble.c', '2325'))

104

InventoryFile('2326', 'wibble.c', parent_id='2325', sha1=None, len=None)

>>> i.add(InventoryEntry('2326', 'wibble.c', parent_id='2325'))

105

>>> i['2326']

106

InventoryFile('2326', 'wibble.c', parent_id='2325', sha1=None, len=None)

107

>>> for path, entry in i.iter_entries():

108

... print path

109

... assert i.path2id(path)

InventoryEntry('2326', 'wibble.c', kind='file', parent_id='2325')

>>> for j in i.iter_entries():

... print j[0]

... assert i.path2id(j[0])

110

...

111

112

src

113

src/bye.c

114

src/hello.c

116

src/wibble/wibble.c

117

>>> i.id2path('2326')

118

'src/wibble/wibble.c'

:todo: Maybe also keep the full path of the entry, and the children?

But those depend on its position within a particular inventory, and

it would be nice not to need to hold the backpointer here.

119

"""

120

121

# Constants returned by describe_change()

122

123

# TODO: These should probably move to some kind of FileChangeDescription

124

# class; that's like what's inside a TreeDelta but we want to be able to

125

# generate them just for one file at a time.

126

RENAMED = 'renamed'

127

MODIFIED_AND_RENAMED = 'modified and renamed'

128

129

__slots__ = []

130

131

def detect_changes(self, old_entry):

132

"""Return a (text_modified, meta_modified) from this to old_entry.

133

134

_read_tree_state must have been called on self and old_entry prior to

135

calling detect_changes.

136

"""

137

return False, False

138

139

def diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

140

output_to, reverse=False):

141

"""Perform a diff from this to to_entry.

142

143

text_diff will be used for textual difference calculation.

144

This is a template method, override _diff in child classes.

145

"""

146

self._read_tree_state(tree.id2path(self.file_id), tree)

147

if to_entry:

148

# cannot diff from one kind to another - you must do a removal

149

# and an add if they do not match.

150

assert self.kind == to_entry.kind

151

to_entry._read_tree_state(to_tree.id2path(to_entry.file_id),

152

to_tree)

153

self._diff(text_diff, from_label, tree, to_label, to_entry, to_tree,

154

output_to, reverse)

155

156

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

157

output_to, reverse=False):

158

"""Perform a diff between two entries of the same kind."""

159

160

def find_previous_heads(self, previous_inventories,

161

versioned_file_store,

162

transaction,

163

entry_vf=None):

164

"""Return the revisions and entries that directly precede this.

165

166

Returned as a map from revision to inventory entry.

167

168

This is a map containing the file revisions in all parents

169

for which the file exists, and its revision is not a parent of

170

any other. If the file is new, the set will be empty.

171

172

:param versioned_file_store: A store where ancestry data on this

173

file id can be queried.

174

:param transaction: The transaction that queries to the versioned

175

file store should be completed under.

176

:param entry_vf: The entry versioned file, if it's already available.

177

"""

178

def get_ancestors(weave, entry):

179

return set(weave.get_ancestry(entry.revision))

180

# revision:ie mapping for each ie found in previous_inventories.

181

candidates = {}

182

# revision:ie mapping with one revision for each head.

183

heads = {}

184

# revision: ancestor list for each head

185

head_ancestors = {}

186

# identify candidate head revision ids.

187

for inv in previous_inventories:

188

if self.file_id in inv:

189

ie = inv[self.file_id]

190

assert ie.file_id == self.file_id

191

if ie.revision in candidates:

192

# same revision value in two different inventories:

193

# correct possible inconsistencies:

194

# * there was a bug in revision updates with 'x' bit

195

# support.

196

try:

197

if candidates[ie.revision].executable != ie.executable:

198

candidates[ie.revision].executable = False

199

ie.executable = False

200

except AttributeError:

201

pass

202

# must now be the same.

203

assert candidates[ie.revision] == ie

204

else:

205

# add this revision as a candidate.

206

candidates[ie.revision] = ie

207

208

# common case optimisation

209

if len(candidates) == 1:

210

# if there is only one candidate revision found

211

# then we can avoid opening the versioned file to access ancestry:

212

# there cannot be any ancestors to eliminate when there is

213

# only one revision available.

214

heads[ie.revision] = ie

215

return heads

216

217

# eliminate ancestors amongst the available candidates:

218

# heads are those that are not an ancestor of any other candidate

219

# - this provides convergence at a per-file level.

220

for ie in candidates.values():

221

# may be an ancestor of a known head:

222

already_present = 0 != len(

223

[head for head in heads

224

if ie.revision in head_ancestors[head]])

225

if already_present:

226

# an ancestor of an analyzed candidate.

227

continue

228

# not an ancestor of a known head:

229

# load the versioned file for this file id if needed

230

if entry_vf is None:

231

entry_vf = versioned_file_store.get_weave_or_empty(

232

self.file_id, transaction)

233

ancestors = get_ancestors(entry_vf, ie)

234

# may knock something else out:

235

check_heads = list(heads.keys())

236

for head in check_heads:

237

if head in ancestors:

238

# this previously discovered 'head' is not

239

# really a head - it's an ancestor of the newly

240

# found head,

241

heads.pop(head)

242

head_ancestors[ie.revision] = ancestors

243

heads[ie.revision] = ie

244

return heads

245

246

def get_tar_item(self, root, dp, now, tree):

247

"""Get a tarfile item and a file stream for its content."""

248

item = tarfile.TarInfo(pathjoin(root, dp))

249

# TODO: would be cool to actually set it to the timestamp of the

250

# revision it was last changed

251

item.mtime = now

252

fileobj = self._put_in_tar(item, tree)

253

return item, fileobj

254

255

def has_text(self):

256

"""Return true if the object this entry represents has textual data.

257

258

Note that textual data includes binary content.

259

260

Also note that all entries get weave files created for them.

261

This attribute is primarily used when upgrading from old trees that

262

did not have the weave index for all inventory entries.

263

"""

264

return False

265

266

def __init__(self, file_id, name, parent_id, text_id=None):

def __init__(self, file_id, name, kind='file', text_id=None,

parent_id=None):

267

100

"""Create an InventoryEntry

268

101

269

102

The filename must be a single component, relative to the

270

103

parent directory; it cannot be a whole path or relative name.

271

104

272

>>> e = InventoryFile('123', 'hello.c', ROOT_ID)

105

>>> e = InventoryEntry('123', 'hello.c')

273

106

>>> e.name

274

107

'hello.c'

275

108

>>> e.file_id

276

109

'123'

277

>>> e = InventoryFile('123', 'src/hello.c', ROOT_ID)

110

>>> e = InventoryEntry('123', 'src/hello.c')

278

111

Traceback (most recent call last):

279

InvalidEntryName: Invalid entry name: src/hello.c

112

BzrError: ("InventoryEntry name is not a simple filename: 'src/hello.c'", [])

280

113

"""

281

assert isinstance(name, basestring), name

282

if '/' in name or '\\' in name:

283

raise InvalidEntryName(name=name)

284

self.executable = False

285

self.revision = None

286

self.text_sha1 = None

287

self.text_size = None

114

115

if len(splitpath(name)) != 1:

116

bailout('InventoryEntry name is not a simple filename: %r'

117

% name)

118

288

119

self.file_id = file_id

289

120

self.name = name

121

assert kind in ['file', 'directory']

122

self.kind = kind

290

123

self.text_id = text_id

291

124

self.parent_id = parent_id

292

self.symlink_target = None

293

294

def kind_character(self):

295

"""Return a short kind indicator useful for appending to names."""

296

raise BzrError('unknown kind %r' % self.kind)

297

298

known_kinds = ('file', 'directory', 'symlink', 'root_directory')

299

300

def _put_in_tar(self, item, tree):

301

"""populate item for stashing in a tar, and return the content stream.

302

303

If no content is available, return None.

304

"""

305

raise BzrError("don't know how to export {%s} of kind %r" %

306

(self.file_id, self.kind))

307

308

def put_on_disk(self, dest, dp, tree):

309

"""Create a representation of self on disk in the prefix dest.

310

311

This is a template method - implement _put_on_disk in subclasses.

312

"""

313

fullpath = pathjoin(dest, dp)

314

self._put_on_disk(fullpath, tree)

315

# mutter(" export {%s} kind %s to %s", self.file_id,

316

# self.kind, fullpath)

317

318

def _put_on_disk(self, fullpath, tree):

319

"""Put this entry onto disk at fullpath, from tree tree."""

320

raise BzrError("don't know how to export {%s} of kind %r" % (self.file_id, self.kind))

125

self.text_sha1 = None

126

self.text_size = None

127

if kind == 'directory':

128

self.children = {}

129

321

130

322

131

def sorted_children(self):

323

return sorted(self.children.items())

324

325

@staticmethod

326

def versionable_kind(kind):

327

return kind in ('file', 'directory', 'symlink')

328

329

def check(self, checker, rev_id, inv, tree):

330

"""Check this inventory entry is intact.

331

332

This is a template method, override _check for kind specific

333

tests.

334

335

:param checker: Check object providing context for the checks;

336

can be used to find out what parts of the repository have already

337

been checked.

338

:param rev_id: Revision id from which this InventoryEntry was loaded.

339

Not necessarily the last-changed revision for this file.

340

:param inv: Inventory from which the entry was loaded.

341

:param tree: RevisionTree for this entry.

342

"""

343

if self.parent_id is not None:

344

if not inv.has_id(self.parent_id):

345

raise BzrCheckError('missing parent {%s} in inventory for revision {%s}'

346

% (self.parent_id, rev_id))

347

self._check(checker, rev_id, tree)

348

349

def _check(self, checker, rev_id, tree):

350

"""Check this inventory entry for kind specific errors."""

351

raise BzrCheckError('unknown entry kind %r in revision {%s}' %

352

(self.kind, rev_id))

132

l = self.children.items()

133

l.sort()

134

return l

135

353

136

354

137

def copy(self):

355

"""Clone this inventory entry."""

356

raise NotImplementedError

357

358

@staticmethod

359

def describe_change(old_entry, new_entry):

360

"""Describe the change between old_entry and this.

361

362

This smells of being an InterInventoryEntry situation, but as its

363

the first one, we're making it a static method for now.

364

365

An entry with a different parent, or different name is considered

366

to be renamed. Reparenting is an internal detail.

367

Note that renaming the parent does not trigger a rename for the

368

child entry itself.

369

"""

370

# TODO: Perhaps return an object rather than just a string

371

if old_entry is new_entry:

372

# also the case of both being None

373

return 'unchanged'

374

elif old_entry is None:

375

return 'added'

376

elif new_entry is None:

377

return 'removed'

378

text_modified, meta_modified = new_entry.detect_changes(old_entry)

379

if text_modified or meta_modified:

380

modified = True

381

else:

382

modified = False

383

# TODO 20060511 (mbp, rbc) factor out 'detect_rename' here.

384

if old_entry.parent_id != new_entry.parent_id:

385

renamed = True

386

elif old_entry.name != new_entry.name:

387

renamed = True

388

else:

389

renamed = False

390

if renamed and not modified:

391

return InventoryEntry.RENAMED

392

if modified and not renamed:

393

return 'modified'

394

if modified and renamed:

395

return InventoryEntry.MODIFIED_AND_RENAMED

396

return 'unchanged'

138

other = InventoryEntry(self.file_id, self.name, self.kind,

139

self.text_id, self.parent_id)

140

other.text_sha1 = self.text_sha1

141

other.text_size = self.text_size

142

return other

143

397

144

398

145

def __repr__(self):

399

return ("%s(%r, %r, parent_id=%r, revision=%r)"

146

return ("%s(%r, %r, kind=%r, parent_id=%r)"

400

147

% (self.__class__.__name__,

401

148

self.file_id,

402

149

self.name,

403

self.parent_id,

404

self.revision))

405

406

def snapshot(self, revision, path, previous_entries,
             work_tree, commit_builder):
    """Make a snapshot of this entry which may or may not have changed.

    This means that all its fields are populated, that it has its
    text stored in the text store or weave.

    :return: "unchanged" when there is exactly one previous entry and
        ``_unchanged`` accepts it; otherwise whatever
        ``_snapshot_into_revision`` returns.
    """
    # mutter('new parents of %s are %r', path, previous_entries)
    self._read_tree_state(path, work_tree)
    # TODO: Where should we determine whether to reuse a
    # previous revision id or create a new revision? 20060606
    if len(previous_entries) == 1:
        # cannot be unchanged unless there is only one parent file rev.
        (parent_ie,) = previous_entries.values()
        if self._unchanged(parent_ie):
            # mutter("found unchanged entry")
            self.revision = parent_ie.revision
            return "unchanged"
    return self._snapshot_into_revision(revision, previous_entries,
                                        work_tree, commit_builder)

426

427

def _snapshot_into_revision(self, revision, previous_entries, work_tree,

428

commit_builder):

429

"""Record this revision unconditionally into a store.

430

431

The entry's last-changed revision property (`revision`) is updated to

432

that of the new revision.

433

434

:param revision: id of the new revision that is being recorded.

435

436

:returns: String description of the commit (e.g. "merged", "modified"), etc.

437

"""

438

# mutter('new revision {%s} for {%s}', revision, self.file_id)

439

self.revision = revision

440

self._snapshot_text(previous_entries, work_tree, commit_builder)

441

442

def _snapshot_text(self, file_parents, work_tree, commit_builder):

443

"""Record the 'text' of this entry, whatever form that takes.

444

445

This default implementation simply adds an empty text.

446

"""

447

raise NotImplementedError(self._snapshot_text)

448

449

def __eq__(self, other):

150

self.kind,

151

self.parent_id))

152

153

154

def to_element(self):
    """Build an XML 'entry' element describing this inventory entry.

    name, file_id and kind are always written; text_size, text_id,
    text_sha1 and parent_id are written only when they are not None.
    """
    elt = Element('entry')

    for attr in ('name', 'file_id', 'kind'):
        elt.set(attr, getattr(self, attr))

    size = self.text_size
    if size is not None:
        elt.set('text_size', '%d' % size)

    for attr in ('text_id', 'text_sha1', 'parent_id'):
        value = getattr(self, attr)
        if value is not None:
            elt.set(attr, value)

    elt.tail = '\n'

    return elt

173

174

175

def from_element(cls, elt):
    """Construct an entry of type ``cls`` from an XML 'entry' element.

    file_id, name and kind are passed to the constructor; text_id,
    text_sha1 and parent_id are copied from the element as-is, and a
    non-empty text_size is converted to an int.
    """
    assert elt.tag == 'entry'
    entry = cls(elt.get('file_id'), elt.get('name'), elt.get('kind'))
    for attr in ('text_id', 'text_sha1', 'parent_id'):
        setattr(entry, attr, elt.get(attr))

    ## mutter("read inventoryentry: %r" % (elt.attrib))

    raw_size = elt.get('text_size')
    if raw_size:
        entry.text_size = int(raw_size)
    else:
        # a missing or empty value is stored unchanged
        entry.text_size = raw_size

    return entry


from_element = classmethod(from_element)

191

192

def __cmp__(self, other):

193

if self is other:

194

return 0

450

195

if not isinstance(other, InventoryEntry):

451

196

return NotImplemented

452

197

453

return ((self.file_id == other.file_id)

454

and (self.name == other.name)

455

and (other.symlink_target == self.symlink_target)

456

and (self.text_sha1 == other.text_sha1)

457

and (self.text_size == other.text_size)

458

and (self.text_id == other.text_id)

459

and (self.parent_id == other.parent_id)

460

and (self.kind == other.kind)

461

and (self.revision == other.revision)

462

and (self.executable == other.executable)

463

)

464

465

def __ne__(self, other):

466

return not (self == other)

467

468

def __hash__(self):

469

raise ValueError('not hashable')

470

471

def _unchanged(self, previous_ie):

472

"""Has this entry changed relative to previous_ie.

473

474

This method should be overridden in child classes.

475

"""

476

compatible = True

477

# different inv parent

478

if previous_ie.parent_id != self.parent_id:

479

compatible = False

480

# renamed

481

elif previous_ie.name != self.name:

482

compatible = False

483

return compatible

484

485

def _read_tree_state(self, path, work_tree):

486

"""Populate fields in the inventory entry from the given tree.

487

488

Note that this should be modified to be a noop on virtual trees

489

as all entries created there are prepopulated.

490

"""

491

# TODO: Rather than running this manually, we should check the

492

# working sha1 and other expensive properties when they're

493

# first requested, or preload them if they're already known

494

pass # nothing to do by default

495

496

def _forget_tree_state(self):

497

pass

198

return cmp(self.file_id, other.file_id) \

199

or cmp(self.name, other.name) \

200

or cmp(self.text_sha1, other.text_sha1) \

201

or cmp(self.text_size, other.text_size) \

202

or cmp(self.text_id, other.text_id) \

203

or cmp(self.parent_id, other.parent_id) \

204

or cmp(self.kind, other.kind)

205

498

206

499

207

500

208

class RootEntry(InventoryEntry):

501

502

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

503

'text_id', 'parent_id', 'children', 'executable',

504

'revision', 'symlink_target']

505

506

def _check(self, checker, rev_id, tree):

507

"""See InventoryEntry._check"""

508

509

209

def __init__(self, file_id):

510

210

self.file_id = file_id

511

211

self.children = {}

512

212

self.kind = 'root_directory'

513

213

self.parent_id = None

514

self.name = u''

515

self.revision = None

214

self.name = ''

516

215

517

def __eq__(self, other):

216

def __cmp__(self, other):

217

if self is other:

218

return 0

518

219

if not isinstance(other, RootEntry):

519

220

return NotImplemented

520

521

return (self.file_id == other.file_id) \

522

and (self.children == other.children)

523

524

525

class InventoryDirectory(InventoryEntry):

526

"""A directory in an inventory."""

527

528

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

529

'text_id', 'parent_id', 'children', 'executable',

530

'revision', 'symlink_target']

531

532

def _check(self, checker, rev_id, tree):

533

"""See InventoryEntry._check"""

534

if self.text_sha1 is not None or self.text_size is not None or self.text_id is not None:

535

raise BzrCheckError('directory {%s} has text in revision {%s}'

536

% (self.file_id, rev_id))

537

538

def copy(self):

539

other = InventoryDirectory(self.file_id, self.name, self.parent_id)

540

other.revision = self.revision

541

# note that children are *not* copied; they're pulled across when

542

# others are added

543

return other

544

545

def __init__(self, file_id, name, parent_id):

546

super(InventoryDirectory, self).__init__(file_id, name, parent_id)

547

self.children = {}

548

self.kind = 'directory'

549

550

def kind_character(self):

551

"""See InventoryEntry.kind_character."""

552

return '/'

553

554

def _put_in_tar(self, item, tree):

555

"""See InventoryEntry._put_in_tar."""

556

item.type = tarfile.DIRTYPE

557

fileobj = None

558

item.name += '/'

559

item.size = 0

560

item.mode = 0755

561

return fileobj

562

563

def _put_on_disk(self, fullpath, tree):

564

"""See InventoryEntry._put_on_disk."""

565

os.mkdir(fullpath)

566

567

def _snapshot_text(self, file_parents, work_tree, commit_builder):

568

"""See InventoryEntry._snapshot_text."""

569

commit_builder.modified_directory(self.file_id, file_parents)

570

571

572

class InventoryFile(InventoryEntry):

573

"""A file in an inventory."""

574

575

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

576

'text_id', 'parent_id', 'children', 'executable',

577

'revision', 'symlink_target']

578

579

def _check(self, checker, tree_revision_id, tree):

580

"""See InventoryEntry._check"""

581

t = (self.file_id, self.revision)

582

if t in checker.checked_texts:

583

prev_sha = checker.checked_texts[t]

584

if prev_sha != self.text_sha1:

585

raise BzrCheckError('mismatched sha1 on {%s} in {%s}' %

586

(self.file_id, tree_revision_id))

587

else:

588

checker.repeated_text_cnt += 1

589

return

590

591

if self.file_id not in checker.checked_weaves:

592

mutter('check weave {%s}', self.file_id)

593

w = tree.get_weave(self.file_id)

594

# Not passing a progress bar, because it creates a new

595

# progress, which overwrites the current progress,

596

# and doesn't look nice

597

w.check()

598

checker.checked_weaves[self.file_id] = True

599

else:

600

w = tree.get_weave(self.file_id)

601

602

mutter('check version {%s} of {%s}', tree_revision_id, self.file_id)

603

checker.checked_text_cnt += 1

604

# We can't check the length, because Weave doesn't store that

605

# information, and the whole point of looking at the weave's

606

# sha1sum is that we don't have to extract the text.

607

if self.text_sha1 != w.get_sha1(self.revision):

608

raise BzrCheckError('text {%s} version {%s} wrong sha1'

609

% (self.file_id, self.revision))

610

checker.checked_texts[t] = self.text_sha1

611

612

def copy(self):

613

other = InventoryFile(self.file_id, self.name, self.parent_id)

614

other.executable = self.executable

615

other.text_id = self.text_id

616

other.text_sha1 = self.text_sha1

617

other.text_size = self.text_size

618

other.revision = self.revision

619

return other

620

621

def detect_changes(self, old_entry):

622

"""See InventoryEntry.detect_changes."""

623

assert self.text_sha1 is not None

624

assert old_entry.text_sha1 is not None

625

text_modified = (self.text_sha1 != old_entry.text_sha1)

626

meta_modified = (self.executable != old_entry.executable)

627

return text_modified, meta_modified

628

629

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

630

output_to, reverse=False):

631

"""See InventoryEntry._diff."""

632

try:

633

from_text = tree.get_file(self.file_id).readlines()

634

if to_entry:

635

to_text = to_tree.get_file(to_entry.file_id).readlines()

636

else:

637

to_text = []

638

if not reverse:

639

text_diff(from_label, from_text,

640

to_label, to_text, output_to)

641

else:

642

text_diff(to_label, to_text,

643

from_label, from_text, output_to)

644

except BinaryFile:

645

if reverse:

646

label_pair = (to_label, from_label)

647

else:

648

label_pair = (from_label, to_label)

649

print >> output_to, "Binary files %s and %s differ" % label_pair

650

651

def has_text(self):

652

"""See InventoryEntry.has_text."""

653

return True

654

655

def __init__(self, file_id, name, parent_id):

656

super(InventoryFile, self).__init__(file_id, name, parent_id)

657

self.kind = 'file'

658

659

def kind_character(self):

660

"""See InventoryEntry.kind_character."""

661

return ''

662

663

def _put_in_tar(self, item, tree):

664

"""See InventoryEntry._put_in_tar."""

665

item.type = tarfile.REGTYPE

666

fileobj = tree.get_file(self.file_id)

667

item.size = self.text_size

668

if tree.is_executable(self.file_id):

669

item.mode = 0755

670

else:

671

item.mode = 0644

672

return fileobj

673

674

def _put_on_disk(self, fullpath, tree):

675

"""See InventoryEntry._put_on_disk."""

676

pumpfile(tree.get_file(self.file_id), file(fullpath, 'wb'))

677

if tree.is_executable(self.file_id):

678

os.chmod(fullpath, 0755)

679

680

def _read_tree_state(self, path, work_tree):

681

"""See InventoryEntry._read_tree_state."""

682

self.text_sha1 = work_tree.get_file_sha1(self.file_id, path=path)

683

# FIXME: 20050930 probe for the text size when getting sha1

684

# in _read_tree_state

685

self.executable = work_tree.is_executable(self.file_id, path=path)

686

687

def __repr__(self):

688

return ("%s(%r, %r, parent_id=%r, sha1=%r, len=%s)"

689

% (self.__class__.__name__,

690

self.file_id,

691

self.name,

692

self.parent_id,

693

self.text_sha1,

694

self.text_size))

695

696

def _forget_tree_state(self):

697

self.text_sha1 = None

698

699

def _snapshot_text(self, file_parents, work_tree, commit_builder):

700

"""See InventoryEntry._snapshot_text."""

701

def get_content_byte_lines():

702

return work_tree.get_file(self.file_id).readlines()

703

self.text_sha1, self.text_size = commit_builder.modified_file_text(

704

self.file_id, file_parents, get_content_byte_lines, self.text_sha1, self.text_size)

705

706

def _unchanged(self, previous_ie):

707

"""See InventoryEntry._unchanged."""

708

compatible = super(InventoryFile, self)._unchanged(previous_ie)

709

if self.text_sha1 != previous_ie.text_sha1:

710

compatible = False

711

else:

712

# FIXME: 20050930 probe for the text size when getting sha1

713

# in _read_tree_state

714

self.text_size = previous_ie.text_size

715

if self.executable != previous_ie.executable:

716

compatible = False

717

return compatible

718

719

720

class InventoryLink(InventoryEntry):

721

"""A file in an inventory."""

722

723

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

724

'text_id', 'parent_id', 'children', 'executable',

725

'revision', 'symlink_target']

726

727

def _check(self, checker, rev_id, tree):

728

"""See InventoryEntry._check"""

729

if self.text_sha1 is not None or self.text_size is not None or self.text_id is not None:

730

raise BzrCheckError('symlink {%s} has text in revision {%s}'

731

% (self.file_id, rev_id))

732

if self.symlink_target is None:

733

raise BzrCheckError('symlink {%s} has no target in revision {%s}'

734

% (self.file_id, rev_id))

735

736

def copy(self):

737

other = InventoryLink(self.file_id, self.name, self.parent_id)

738

other.symlink_target = self.symlink_target

739

other.revision = self.revision

740

return other

741

742

def detect_changes(self, old_entry):

743

"""See InventoryEntry.detect_changes."""

744

# FIXME: which _modified field should we use ? RBC 20051003

745

text_modified = (self.symlink_target != old_entry.symlink_target)

746

if text_modified:

747

mutter(" symlink target changed")

748

meta_modified = False

749

return text_modified, meta_modified

750

751

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

752

output_to, reverse=False):

753

"""See InventoryEntry._diff."""

754

from_text = self.symlink_target

755

if to_entry is not None:

756

to_text = to_entry.symlink_target

757

if reverse:

758

temp = from_text

759

from_text = to_text

760

to_text = temp

761

print >>output_to, '=== target changed %r => %r' % (from_text, to_text)

762

else:

763

if not reverse:

764

print >>output_to, '=== target was %r' % self.symlink_target

765

else:

766

print >>output_to, '=== target is %r' % self.symlink_target

767

768

def __init__(self, file_id, name, parent_id):

769

super(InventoryLink, self).__init__(file_id, name, parent_id)

770

self.kind = 'symlink'

771

772

def kind_character(self):

773

"""See InventoryEntry.kind_character."""

774

return ''

775

776

def _put_in_tar(self, item, tree):

777

"""See InventoryEntry._put_in_tar."""

778

item.type = tarfile.SYMTYPE

779

fileobj = None

780

item.size = 0

781

item.mode = 0755

782

item.linkname = self.symlink_target

783

return fileobj

784

785

def _put_on_disk(self, fullpath, tree):

786

"""See InventoryEntry._put_on_disk."""

787

try:

788

os.symlink(self.symlink_target, fullpath)

789

except OSError,e:

790

raise BzrError("Failed to create symlink %r -> %r, error: %s" % (fullpath, self.symlink_target, e))

791

792

def _read_tree_state(self, path, work_tree):

793

"""See InventoryEntry._read_tree_state."""

794

self.symlink_target = work_tree.get_symlink_target(self.file_id)

795

796

def _forget_tree_state(self):

797

self.symlink_target = None

798

799

def _unchanged(self, previous_ie):

800

"""See InventoryEntry._unchanged."""

801

compatible = super(InventoryLink, self)._unchanged(previous_ie)

802

if self.symlink_target != previous_ie.symlink_target:

803

compatible = False

804

return compatible

805

806

def _snapshot_text(self, file_parents, work_tree, commit_builder):

807

"""See InventoryEntry._snapshot_text."""

808

commit_builder.modified_link(

809

self.file_id, file_parents, self.symlink_target)

810

811

812

class Inventory(object):

221

return cmp(self.file_id, other.file_id) \

222

or cmp(self.children, other.children)

223

224

225

226

class Inventory(XMLMixin):

813

227

"""Inventory of versioned files in a tree.

814

228

815

This describes which file_id is present at each point in the tree,

816

and possibly the SHA-1 or other information about the file.

817

Entries can be looked up either by path or by file_id.

229

An Inventory acts like a set of InventoryEntry items. You can

230

also look files up by their file_id or name.

231

232

May be read from and written to a metadata file in a tree. To

233

manipulate the inventory (for example to add a file), it is read

234

in, modified, and then written back out.

818

235

819

236

The inventory represents a typical unix file tree, with

820

237

directories containing files and subdirectories. We never store

827

244

inserted, other than through the Inventory API.

828

245

829

246

>>> inv = Inventory()

830

>>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))

831

InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT', sha1=None, len=None)

247

>>> inv.write_xml(sys.stdout)

248

249

</inventory>

250

>>> inv.add(InventoryEntry('123-123', 'hello.c'))

832

251

>>> inv['123-123'].name

833

252

'hello.c'

834

253

842

261

May also look up by name:

843

262

844

263

>>> [x[0] for x in inv.iter_entries()]

845

['', u'hello.c']

846

>>> inv = Inventory('TREE_ROOT-12345678-12345678')

847

>>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))

848

InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT-12345678-12345678', sha1=None, len=None)

264

['hello.c']

265

266

>>> inv.write_xml(sys.stdout)

267

268

269

</inventory>

270

849

271

"""

850

def __init__(self, root_id=ROOT_ID, revision_id=None):

272

273

## TODO: Make sure only canonical filenames are stored.

274

275

## TODO: Do something sensible about the possible collisions on

276

## case-losing filesystems. Perhaps we should just always forbid

277

## such collisions.

278

279

## TODO: No special cases for root, rather just give it a file id

280

## like everything else.

281

282

## TODO: Probably change XML serialization to use nesting

283

284

def __init__(self):

851

285

"""Create or read an inventory.

852

286

853

287

If a working directory is specified, the inventory is read

857

291

The inventory is created with a default root directory, with

858

292

an id of None.

859

293

"""

860

# We are letting Branch.create() create a unique inventory

861

# root id. Rather than generating a random one here.

862

#if root_id is None:

863

# root_id = bzrlib.branch.gen_file_id('TREE_ROOT')

864

self.root = RootEntry(root_id)

865

# FIXME: this isn't ever used, changing it to self.revision may break

866

# things. TODO make everything use self.revision_id

867

self.revision_id = revision_id

868

self._byid = {self.root.file_id: self.root}

294

self.root = RootEntry(None)

295

self._byid = {None: self.root}

869

296

870

def copy(self):
    """Return a new Inventory containing copies of this one's entries.

    The new inventory is created with the same root file id; every other
    entry is duplicated with its own ``copy()`` and added in
    ``iter_entries()`` order. The revision_id is not carried over.
    """
    # TODO: jam 20051218 Should copy also copy the revision_id?
    entries = self.iter_entries()
    # the first pair yielded by iter_entries() is the root entry; it is
    # consumed here to seed the new inventory and is not added again
    other = Inventory(entries.next()[1].file_id)
    # copy recursively so we know directories will be added before
    # their children. There are more efficient ways than this...
    # (iterate the generator itself: calling it raises TypeError)
    for path, entry in entries:
        other.add(entry.copy())
    return other

879

297

880

298

def __iter__(self):

881

299

return iter(self._byid)

882

300

301

883

302

def __len__(self):

884

303

"""Returns number of entries."""

885

304

return len(self._byid)

886

305

306

887

307

def iter_entries(self, from_dir=None):
    """Return (path, entry) pairs, in order by name.

    :param from_dir: directory entry, or the file id of one, to start
        from. When None the walk starts at the root, and ('', root) is
        yielded first.

    Each directory is followed immediately by its own contents. Paths are
    relative to the starting directory.
    """
    if from_dir is None:
        assert self.root
        from_dir = self.root
        yield '', self.root
    elif isinstance(from_dir, basestring):
        from_dir = self._byid[from_dir]

    # unrolling the recursive call changed the time from
    # 440ms/663ms (inline/total) to 116ms/116ms
    top_level = collections.deque(sorted(from_dir.children.items()))
    pending = [(u'', top_level)]
    while pending:
        dir_relpath, remaining = pending[-1]
        descended = False
        while remaining and not descended:
            name, entry = remaining.popleft()

            # dir_relpath never ends in a slash and name does not begin
            # with one, so plain concatenation replaces pathjoin(); the
            # price is that every path here starts with a slash, which is
            # stripped when yielding
            entry_path = dir_relpath + '/' + name

            yield entry_path[1:], entry

            if entry.kind == 'directory':
                # visit this directory's contents before its siblings
                contents = collections.deque(sorted(entry.children.items()))
                pending.append((entry_path, contents))
                descended = True
        if not descended:
            # every child of this directory has been yielded
            pending.pop()

929

930

def iter_entries_by_dir(self, from_dir=None):
    """Iterate over the entries in a directory first order.

    This returns all entries for a directory before returning
    the entries for children of a directory. This is not
    lexicographically sorted order, and is a hybrid between
    depth-first and breadth-first.

    :param from_dir: directory entry, or the file id of one, to start
        from. When None the walk starts at the root, and ('', root) is
        yielded first.
    :return: This yields (path, entry) pairs
    """
    # TODO? Perhaps this should return the from_dir so that the root is
    # yielded? or maybe an option?
    if from_dir is None:
        assert self.root
        from_dir = self.root
        yield '', self.root
    elif isinstance(from_dir, basestring):
        from_dir = self._byid[from_dir]

    # each pending item is (path prefix ending in '/' or empty, directory)
    pending = [(u'', from_dir)]
    while pending:
        prefix, directory = pending.pop()

        subdirs = []
        for name, entry in sorted(directory.children.items()):
            relpath = prefix + name
            yield relpath, entry
            if entry.kind == 'directory':
                subdirs.append((relpath + '/', entry))
        # pushed in reverse so the first subdirectory by name is popped next
        pending.extend(reversed(subdirs))

963

964

def entries(self):

965

"""Return list of (path, ie) for all entries except the root.

966

967

This may be faster than iter_entries.

968

"""

969

accum = []

970

def descend(dir_ie, dir_path):

971

kids = dir_ie.children.items()

972

kids.sort()

973

for name, ie in kids:

974

child_path = pathjoin(dir_path, name)

975

accum.append((child_path, ie))

309

if from_dir == None:

310

assert self.root

311

from_dir = self.root

312

elif isinstance(from_dir, basestring):

313

from_dir = self._byid[from_dir]

314

315

kids = from_dir.children.items()

316

kids.sort()

317

for name, ie in kids:

318

yield name, ie

319

if ie.kind == 'directory':

320

for cn, cie in self.iter_entries(from_dir=ie.file_id):

321

yield '/'.join((name, cn)), cie

322

323

324

325

def directories(self, from_dir=None):

326

"""Return (path, entry) pairs for all directories.

327

"""

328

def descend(parent_ie):

329

parent_name = parent_ie.name

330

yield parent_name, parent_ie

331

332

# directory children in sorted order

333

dn = []

334

for ie in parent_ie.children.itervalues():

976

335

if ie.kind == 'directory':

977

descend(ie, child_path)

978

979

descend(self.root, u'')

980

return accum

981

982

def directories(self):

983

"""Return (path, entry) pairs for all directories, including the root.

984

"""

985

accum = []

986

def descend(parent_ie, parent_path):

987

accum.append((parent_path, parent_ie))

336

dn.append((ie.name, ie))

337

dn.sort()

988

338

989

kids = [(ie.name, ie) for ie in parent_ie.children.itervalues() if ie.kind == 'directory']

990

kids.sort()

339

for name, child_ie in dn:

340

for sub_name, sub_ie in descend(child_ie):

341

yield appendpath(parent_name, sub_name), sub_ie

991

342

992

for name, child_ie in kids:

993

child_path = pathjoin(parent_path, name)

994

descend(child_ie, child_path)

995

descend(self.root, u'')

996

return accum

343

for name, ie in descend(self.root):

344

yield name, ie

997

345

346

347

998

348

def __contains__(self, file_id):

999

349

"""True if this entry contains a file with given id.

1000

350

1001

351

>>> inv = Inventory()

1002

>>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))

1003

InventoryFile('123', 'foo.c', parent_id='TREE_ROOT', sha1=None, len=None)

352

>>> inv.add(InventoryEntry('123', 'foo.c'))

1004

353

>>> '123' in inv

1005

354

True

1006

355

>>> '456' in inv

1008

357

"""

1009

358

return file_id in self._byid

1010

359

360

1011

361

def __getitem__(self, file_id):

1012

362

"""Return the entry for given file_id.

1013

363

1014

364

>>> inv = Inventory()

1015

>>> inv.add(InventoryFile('123123', 'hello.c', ROOT_ID))

1016

InventoryFile('123123', 'hello.c', parent_id='TREE_ROOT', sha1=None, len=None)

365

>>> inv.add(InventoryEntry('123123', 'hello.c'))

1017

366

>>> inv['123123'].name

1018

367

'hello.c'

1019

368

"""

1020

try:

1021

return self._byid[file_id]

1022

except KeyError:

1023

if file_id is None:

1024

raise BzrError("can't look up file_id None")

1025

else:

1026

raise BzrError("file_id {%s} not in inventory" % file_id)

369

return self._byid[file_id]

1027

370

1028

def get_file_kind(self, file_id):
    """Return the ``kind`` of the entry stored under file_id.

    The by-id map is indexed directly, so an unknown id raises KeyError.
    """
    entry = self._byid[file_id]
    return entry.kind

1030

371

1031

372

def get_child(self, parent_id, filename):
    """Return the child of parent_id named filename, or None if absent."""
    parent = self[parent_id]
    return parent.children.get(filename)

1033

374

375

1034

376

def add(self, entry):

1035

377

"""Add entry to inventory.

1036

378

1037

379

To add a file to a branch ready to be committed, use Branch.add,

1038

which calls this.

1039

1040

Returns the new entry object.

1041

"""

380

which calls this."""

1042

381

if entry.file_id in self._byid:

1043

raise BzrError("inventory already contains entry with id {%s}" % entry.file_id)

1044

1045

if entry.parent_id == ROOT_ID or entry.parent_id is None:

1046

entry.parent_id = self.root.file_id

382

bailout("inventory already contains entry with id {%s}" % entry.file_id)

1047

383

1048

384

try:

1049

385

parent = self._byid[entry.parent_id]

1050

386

except KeyError:

1051

raise BzrError("parent_id {%s} not in inventory" % entry.parent_id)

387

bailout("parent_id %r not in inventory" % entry.parent_id)

1052

388

1053

if entry.name in parent.children:

1054

raise BzrError("%s is already versioned" %

1055

pathjoin(self.id2path(parent.file_id), entry.name))

389

if parent.children.has_key(entry.name):

390

bailout("%s is already versioned" %

391

appendpath(self.id2path(parent.file_id), entry.name))

1056

392

1057

393

self._byid[entry.file_id] = entry

1058

394

parent.children[entry.name] = entry

1059

return entry

1060

1061

def add_path(self, relpath, kind, file_id=None, parent_id=None):

395

396

397

def add_path(self, relpath, kind, file_id=None):

1062

398

"""Add entry from a path.

1063

399

1064

The immediate parent must already be versioned.

1065

1066

Returns the new entry object."""

1067

1068

parts = osutils.splitpath(relpath)

1069

400

The immediate parent must already be versioned"""

401

parts = bzrlib.osutils.splitpath(relpath)

1070

402

if len(parts) == 0:

1071

if file_id is None:

1072

file_id = bzrlib.workingtree.gen_root_id()

1073

self.root = RootEntry(file_id)

1074

self._byid = {self.root.file_id: self.root}

1075

return

1076

else:

1077

parent_path = parts[:-1]

1078

parent_id = self.path2id(parent_path)

1079

if parent_id is None:

1080

raise NotVersionedError(path=parent_path)

1081

ie = make_entry(kind, parts[-1], parent_id, file_id)

403

bailout("cannot re-add root of inventory")

404

405

if file_id is None:

406

file_id = bzrlib.branch.gen_file_id(relpath)

407

408

parent_id = self.path2id(parts[:-1])

409

ie = InventoryEntry(file_id, parts[-1],

410

kind=kind, parent_id=parent_id)

1082

411

return self.add(ie)

1083

412

413

1084

414

def __delitem__(self, file_id):

1085

415

"""Remove entry by id.

1086

416

1087

417

>>> inv = Inventory()

1088

>>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))

1089

InventoryFile('123', 'foo.c', parent_id='TREE_ROOT', sha1=None, len=None)

418

>>> inv.add(InventoryEntry('123', 'foo.c'))

1090

419

>>> '123' in inv

1091

420

True

1092

421

>>> del inv['123']

1095

424

"""

1096

425

ie = self[file_id]

1097

426

1098

assert ie.parent_id is None or \

1099

self[ie.parent_id].children[ie.name] == ie

427

assert self[ie.parent_id].children[ie.name] == ie

1100

428

429

# TODO: Test deleting all children; maybe hoist to a separate

430

# deltree method?

431

if ie.kind == 'directory':

432

for cie in ie.children.values():

433

del self[cie.file_id]

434

del ie.children

435

1101

436

del self._byid[file_id]

1102

if ie.parent_id is not None:

1103

del self[ie.parent_id].children[ie.name]

1104

1105

def __eq__(self, other):

437

del self[ie.parent_id].children[ie.name]

438

439

440

def id_set(self):
    """Return a Set built from the keys of the by-id map."""
    ids = Set(self._byid)
    return ids

442

443

444

def to_element(self):
    """Convert to XML Element.

    Builds an 'inventory' element and appends each entry's own element in
    ``iter_entries()`` order.
    """
    root_elt = Element('inventory')
    root_elt.text = '\n'
    for _path, entry in self.iter_entries():
        root_elt.append(entry.to_element())
    return root_elt

451

452

453

def from_element(cls, elt):
    """Construct from XML Element

    >>> inv = Inventory()
    >>> inv.add(InventoryEntry('foo.c-123981239', 'foo.c'))
    >>> elt = inv.to_element()
    >>> inv2 = Inventory.from_element(elt)
    >>> inv2 == inv
    True
    """
    assert elt.tag == 'inventory'
    inventory = cls()
    # each child element is parsed into an entry and added in document order
    for child in elt:
        entry = InventoryEntry.from_element(child)
        inventory.add(entry)
    return inventory


from_element = classmethod(from_element)

470

471

472

def __cmp__(self, other):

1106

473

"""Compare two sets by comparing their contents.

1107

474

1108

475

>>> i1 = Inventory()

1109

476

>>> i2 = Inventory()

1110

477

>>> i1 == i2

1111

478

True

1112

>>> i1.add(InventoryFile('123', 'foo', ROOT_ID))

1113

InventoryFile('123', 'foo', parent_id='TREE_ROOT', sha1=None, len=None)

479

>>> i1.add(InventoryEntry('123', 'foo'))

1114

480

>>> i1 == i2

1115

481

False

1116

>>> i2.add(InventoryFile('123', 'foo', ROOT_ID))

1117

InventoryFile('123', 'foo', parent_id='TREE_ROOT', sha1=None, len=None)

482

>>> i2.add(InventoryEntry('123', 'foo'))

1118

483

>>> i1 == i2

1119

484

True

1120

485

"""

486

if self is other:

487

return 0

488

1121

489

if not isinstance(other, Inventory):

1122

490

return NotImplemented

1123

491

1124

return self._byid == other._byid

1125

1126

def __ne__(self, other):
    """Return the logical negation of __eq__.

    :param other: the object to compare against.
    :return: True or False when __eq__ gives a definite answer, or
        NotImplemented when __eq__ returns NotImplemented.
    """
    equal = self.__eq__(other)
    if equal is NotImplemented:
        # NotImplemented is truthy, so negating it would yield False and
        # report an unrelated object as "not different".  Pass it through
        # so the interpreter can fall back to its default handling.
        return NotImplemented
    return not equal

1128

1129

def __hash__(self):
    """Refuse to hash: always raises ValueError('not hashable')."""
    reason = 'not hashable'
    raise ValueError(reason)

1131

1132

def _iter_file_id_parents(self, file_id):

1133

"""Yield the parents of file_id up to the root."""

1134

while file_id is not None:

1135

try:

1136

ie = self._byid[file_id]

1137

except KeyError:

1138

raise BzrError("file_id {%s} not found in inventory" % file_id)

1139

yield ie

492

if self.id_set() ^ other.id_set():

493

return 1

494

495

for file_id in self._byid:

496

c = cmp(self[file_id], other[file_id])

497

if c: return c

498

499

return 0

500

501

502

def id2path(self, file_id):

503

"""Return as a list the path to file_id."""

504

p = []

505

while file_id != None:

506

ie = self._byid[file_id]

507

p.insert(0, ie.name)

1140

508

file_id = ie.parent_id

1141

1142

def get_idpath(self, file_id):
    """Return a list of file_ids for the path to an entry.

    The list holds one id per enclosing directory, outermost first, and
    ends with the id of the entry itself.  Its length therefore equals
    the depth of the entry in the tree, counting the root directory as
    depth 1.
    """
    # _iter_file_id_parents walks from the entry outwards, so collect the
    # ids in that order and flip the list once at the end.
    idpath = [entry.file_id
              for entry in self._iter_file_id_parents(file_id)]
    idpath.reverse()
    return idpath

1154

1155

def id2path(self, file_id):
    """Return as a string the path to file_id.

    The path is the '/'-joined names of the entry and its ancestors,
    outermost first, with the root entry left out.

    >>> i = Inventory()
    >>> e = i.add(InventoryDirectory('src-id', 'src', ROOT_ID))
    >>> e = i.add(InventoryFile('foo-id', 'foo.c', parent_id='src-id'))
    >>> print i.id2path('foo-id')
    src/foo.c
    """
    names = [entry.name for entry in self._iter_file_id_parents(file_id)]
    # The walk ends at the root, whose name is not part of the path.
    del names[-1:]
    names.reverse()
    return '/'.join(names)

509

return '/'.join(p)

1168

510

511

512

1169

513

def path2id(self, name):

1170

514

"""Walk down through directories to return entry of last component.

1171

515

1174

518

1175

519

This returns the entry of the last component in the path,

1176

520

which may be either a file or a directory.

1177

1178

Returns None IFF the path is not found.

1179

521

"""

1180

522

if isinstance(name, types.StringTypes):

1181

523

name = splitpath(name)

1182

524

1183

# mutter("lookup path %r" % name)

1184

1185

parent = self.root

525

parent = self[None]

1186

526

for f in name:

1187

527

try:

1188

528

cie = parent.children[f]

1189

529

assert cie.name == f

1190

assert cie.parent_id == parent.file_id

1191

530

parent = cie

1192

531

except KeyError:

1193

532

# or raise an error?

1195

534

1196

535

return parent.file_id

1197

536

537

1198

538

def has_filename(self, names):
    """Return True if path2id() yields a true value for names."""
    file_id = self.path2id(names)
    return bool(file_id)

1200

540

541

1201

542

def has_id(self, file_id):
    """Return True if file_id is a key of this inventory's id map.

    :param file_id: the file id to look up in self._byid.
    :return: True when the id is present, otherwise False.
    """
    # The 'in' operator replaces the deprecated dict.has_key().
    return file_id in self._byid

1203

544

545

1204

546

def rename(self, file_id, new_parent_id, new_name):

1205

547

"""Move a file within the inventory.

1206

548

1208

550

1209

551

This does not move the working file."""

1210

552

if not is_valid_name(new_name):

1211

raise BzrError("not an acceptable filename: %r" % new_name)

553

bailout("not an acceptable filename: %r" % new_name)

1212

554

1213

555

new_parent = self._byid[new_parent_id]

1214

556

if new_name in new_parent.children:

1215

raise BzrError("%r already exists in %r" % (new_name, self.id2path(new_parent_id)))

1216

1217

new_parent_idpath = self.get_idpath(new_parent_id)

1218

if file_id in new_parent_idpath:

1219

raise BzrError("cannot move directory %r into a subdirectory of itself, %r"

1220

% (self.id2path(file_id), self.id2path(new_parent_id)))

557

bailout("%r already exists in %r" % (new_name, self.id2path(new_parent_id)))

1221

558

1222

559

file_ie = self._byid[file_id]

1223

560

old_parent = self._byid[file_ie.parent_id]

1231

568

file_ie.parent_id = new_parent_id

1232

569

1233

570

1234

def make_entry(kind, name, parent_id, file_id=None):
    """Create an inventory entry.

    :param kind: the type of inventory entry to create; one of
        'directory', 'file' or 'symlink'.
    :param name: the basename of the entry.
    :param parent_id: the parent_id of the entry.
    :param file_id: the file_id to use. if None, one will be created
        from the name as given (before any normalization).
    :raises errors.InvalidNormalization: if the normalized form of name
        differs from name and is reported as not accessible.
    :raises BzrError: if kind is not one of the known kinds.
    """
    if file_id is None:
        file_id = bzrlib.workingtree.gen_file_id(name)

    norm_name, can_access = osutils.normalized_filename(name)
    if norm_name != name:
        if not can_access:
            # TODO: jam 20060701 This would probably be more useful
            #       if the error was raised with the full path
            raise errors.InvalidNormalization(name)
        name = norm_name

    if kind == 'directory':
        return InventoryDirectory(file_id, name, parent_id)
    if kind == 'file':
        return InventoryFile(file_id, name, parent_id)
    if kind == 'symlink':
        return InventoryLink(file_id, name, parent_id)
    raise BzrError("unknown kind %r" % kind)

1262

1263

1264

# Compiled lazily by is_valid_name() on first use.
_NAME_RE = None


def is_valid_name(name):
    """Return True if name is usable as a single path component.

    A valid name is non-empty and contains neither '/' nor a backslash.

    :param name: the candidate basename.
    :return: True if the name matches, otherwise False.
    """
    global _NAME_RE
    if _NAME_RE is None:
        # Compile once and cache at module level for later calls.
        _NAME_RE = re.compile(r'^[^/\\]+$')

    return bool(_NAME_RE.match(name))

577

578

579

580

# When executed as a script, run this module's doctests.
if __name__ == '__main__':
    import doctest
    import inventory
    doctest.testmod(inventory)

Older »