~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/inventory.py

Committer: Martin Pool
Date: 2005-06-20 04:24:35 UTC
Revision ID: mbp@sourcefrog.net-20050620042435-7c315b5a93001b89

- add jk's patchwork client

files added:
bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/statcache.py

bzrlib/upgrade.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/new-inventory-sample.xml

notes/performance.txt

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/progress.diff

patches/symlink-support.patch

testbzr

files removed:
BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS.developers

bzrlib/annotate.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/read_bundle.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v07.py

bzrlib/bzrdir.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/identitymap.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lsprof.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/store

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/emacs

contrib/emacs/bzr-mode.el

doc/README.1st

doc/configuration.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

generate_docs.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

files renamed:
tools/doc_generate/autodoc_man.py => bzr-man.py

bzrlib/bundle/__init__.py => bzrlib/changeset.py

contrib/newinventory.py => bzrlib/newinventory.py

bzrlib/tests/__init__.py => bzrlib/selftest.py

bzrlib/store/__init__.py => bzrlib/store.py

bzrlib/tests/test_whitebox.py => bzrlib/whitebox.py

bzrlib/xml_serializer.py => bzrlib/xml.py

bzrlib/util/elementtree/ => elementtree/

bzrlib/util/urlgrabber/ => urlgrabber/

files modified:
.bzrignore

.rsyncexclude

NEWS

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/help.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/workingtree.py

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh/_bzr

setup.py *

Show diffs side-by-side

added added

removed removed

bzrlib/inventory.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# FIXME: This refactoring of the workingtree code doesn't seem to keep

# the WorkingTree's copy of the inventory in sync with the branch. The

# branch modifies its working inventory when it does a commit to make

# missing files permanently removed.

# TODO: Maybe also keep the full path of the entry, and the children?

# But those depend on its position within a particular inventory, and

# it would be nice not to need to hold the backpointer here.

# This should really be an id randomly assigned when the tree is

# created, but it's not for now.

ROOT_ID = "TREE_ROOT"

import collections

import os.path

import re

import sys

import tarfile

import types

import sys, os.path, types, re

try:

from cElementTree import Element, ElementTree, SubElement

except ImportError:

from elementtree.ElementTree import Element, ElementTree, SubElement

from bzrlib.xml import XMLMixin

from bzrlib.errors import BzrError, BzrCheckError

import bzrlib

from bzrlib.osutils import (pumpfile, quotefn, splitpath, joinpath,

pathjoin, sha_strings)

from bzrlib.errors import (NotVersionedError, InvalidEntryName,

BzrError, BzrCheckError, BinaryFile)

from bzrlib.osutils import uuid, quotefn, splitpath, joinpath, appendpath

from bzrlib.trace import mutter

class InventoryEntry(object):

class InventoryEntry(XMLMixin):

"""Description of a versioned file.

An InventoryEntry has the following fields, which are also

present in the XML inventory-entry element:

file_id

name

(within the parent directory)

parent_id

file_id of the parent directory, or ROOT_ID

revision

the revision_id in which this variation of this file was

introduced.

executable

Indicates that this file should be executable on systems

that support it.

text_sha1

sha-1 of the text of the file

text_size

size in bytes of the text of the file

(reading a version 4 tree created a text_id field.)

* *file_id*

* *name*: (only the basename within the directory, must not

contain slashes)

* *kind*: "directory" or "file"

* *directory_id*: (if absent/null means the branch root directory)

* *text_sha1*: only for files

* *text_size*: in bytes, only for files

* *text_id*: identifier for the text version, only for files

InventoryEntries can also exist inside a WorkingTree

inventory, in which case they are not yet bound to a

particular revision of the file. In that case the text_sha1,

text_size and text_id are absent.

>>> i = Inventory()

>>> i.path2id('')

'TREE_ROOT'

>>> i.add(InventoryDirectory('123', 'src', ROOT_ID))

InventoryDirectory('123', 'src', parent_id='TREE_ROOT')

>>> i.add(InventoryFile('2323', 'hello.c', parent_id='123'))

InventoryFile('2323', 'hello.c', parent_id='123')

>>> shouldbe = {0: 'src', 1: pathjoin('src','hello.c')}

>>> for ix, j in enumerate(i.iter_entries()):

... print (j[0] == shouldbe[ix], j[1])

>>> i.add(InventoryEntry('123', 'src', 'directory', ROOT_ID))

>>> i.add(InventoryEntry('2323', 'hello.c', 'file', parent_id='123'))

>>> for j in i.iter_entries():

... print j

...

(True, InventoryDirectory('123', 'src', parent_id='TREE_ROOT'))

(True, InventoryFile('2323', 'hello.c', parent_id='123'))

>>> i.add(InventoryFile('2323', 'bye.c', '123'))

('src', InventoryEntry('123', 'src', kind='directory', parent_id='TREE_ROOT'))

('src/hello.c', InventoryEntry('2323', 'hello.c', kind='file', parent_id='123'))

>>> i.add(InventoryEntry('2323', 'bye.c', 'file', '123'))

Traceback (most recent call last):

...

BzrError: inventory already contains entry with id {2323}

>>> i.add(InventoryFile('2324', 'bye.c', '123'))

InventoryFile('2324', 'bye.c', parent_id='123')

>>> i.add(InventoryDirectory('2325', 'wibble', '123'))

InventoryDirectory('2325', 'wibble', parent_id='123')

>>> i.add(InventoryEntry('2324', 'bye.c', 'file', '123'))

>>> i.add(InventoryEntry('2325', 'wibble', 'directory', '123'))

>>> i.path2id('src/wibble')

'2325'

>>> '2325' in i

100

True

101

>>> i.add(InventoryFile('2326', 'wibble.c', '2325'))

102

InventoryFile('2326', 'wibble.c', parent_id='2325')

>>> i.add(InventoryEntry('2326', 'wibble.c', 'file', '2325'))

103

>>> i['2326']

104

InventoryFile('2326', 'wibble.c', parent_id='2325')

105

>>> for path, entry in i.iter_entries():

106

... print path

107

... assert i.path2id(path)

InventoryEntry('2326', 'wibble.c', kind='file', parent_id='2325')

>>> for j in i.iter_entries():

... print j[0]

... assert i.path2id(j[0])

108

...

109

src

110

src/bye.c

113

src/wibble/wibble.c

114

>>> i.id2path('2326')

115

'src/wibble/wibble.c'

TODO: Maybe also keep the full path of the entry, and the children?

But those depend on its position within a particular inventory, and

it would be nice not to need to hold the backpointer here.

116

"""

117

118

# Constants returned by describe_change()

119

120

# TODO: These should probably move to some kind of FileChangeDescription

121

# class; that's like what's inside a TreeDelta but we want to be able to

122

# generate them just for one file at a time.

123

RENAMED = 'renamed'

124

MODIFIED_AND_RENAMED = 'modified and renamed'

# TODO: split InventoryEntry into subclasses for files,

# directories, etc etc.

100

101

text_sha1 = None

102

text_size = None

125

103

126

__slots__ = []

127

128

def detect_changes(self, old_entry):

129

"""Return a (text_modified, meta_modified) from this to old_entry.

130

131

_read_tree_state must have been called on self and old_entry prior to

132

calling detect_changes.

133

"""

134

return False, False

135

136

def diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

137

output_to, reverse=False):

138

"""Perform a diff from this to to_entry.

139

140

text_diff will be used for textual difference calculation.

141

This is a template method, override _diff in child classes.

142

"""

143

self._read_tree_state(tree.id2path(self.file_id), tree)

144

if to_entry:

145

# cannot diff from one kind to another - you must do a removal

146

# and an add if they do not match.

147

assert self.kind == to_entry.kind

148

to_entry._read_tree_state(to_tree.id2path(to_entry.file_id),

149

to_tree)

150

self._diff(text_diff, from_label, tree, to_label, to_entry, to_tree,

151

output_to, reverse)

152

153

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

154

output_to, reverse=False):

155

"""Perform a diff between two entries of the same kind."""

156

157

def find_previous_heads(self, previous_inventories,

158

versioned_file_store,

159

transaction,

160

entry_vf=None):

161

"""Return the revisions and entries that directly precede this.

162

163

Returned as a map from revision to inventory entry.

164

165

This is a map containing the file revisions in all parents

166

for which the file exists, and its revision is not a parent of

167

any other. If the file is new, the set will be empty.

168

169

:param versioned_file_store: A store where ancestry data on this

170

file id can be queried.

171

:param transaction: The transaction that queries to the versioned

172

file store should be completed under.

173

:param entry_vf: The entry versioned file, if it's already available.

174

"""

175

def get_ancestors(weave, entry):

176

return set(weave.get_ancestry(entry.revision))

177

# revision:ie mapping for each ie found in previous_inventories.

178

candidates = {}

179

# revision:ie mapping with one revision for each head.

180

heads = {}

181

# revision: ancestor list for each head

182

head_ancestors = {}

183

# identify candidate head revision ids.

184

for inv in previous_inventories:

185

if self.file_id in inv:

186

ie = inv[self.file_id]

187

assert ie.file_id == self.file_id

188

if ie.revision in candidates:

189

# same revision value in two different inventories:

190

# correct possible inconsistencies:

191

# * there was a bug in revision updates with 'x' bit

192

# support.

193

try:

194

if candidates[ie.revision].executable != ie.executable:

195

candidates[ie.revision].executable = False

196

ie.executable = False

197

except AttributeError:

198

pass

199

# must now be the same.

200

assert candidates[ie.revision] == ie

201

else:

202

# add this revision as a candidate.

203

candidates[ie.revision] = ie

204

205

# common case optimisation

206

if len(candidates) == 1:

207

# if there is only one candidate revision found

208

# then we can avoid opening the versioned file to access ancestry:

209

# there cannot be any ancestors to eliminate when there is

210

# only one revision available.

211

heads[ie.revision] = ie

212

return heads

213

214

# eliminate ancestors amongst the available candidates:

215

# heads are those that are not an ancestor of any other candidate

216

# - this provides convergence at a per-file level.

217

for ie in candidates.values():

218

# may be an ancestor of a known head:

219

already_present = 0 != len(

220

[head for head in heads

221

if ie.revision in head_ancestors[head]])

222

if already_present:

223

# an ancestor of an analyzed candidate.

224

continue

225

# not an ancestor of a known head:

226

# load the versioned file for this file id if needed

227

if entry_vf is None:

228

entry_vf = versioned_file_store.get_weave_or_empty(

229

self.file_id, transaction)

230

ancestors = get_ancestors(entry_vf, ie)

231

# may knock something else out:

232

check_heads = list(heads.keys())

233

for head in check_heads:

234

if head in ancestors:

235

# this previously discovered 'head' is not

236

# really a head - it's an ancestor of the newly

237

# found head,

238

heads.pop(head)

239

head_ancestors[ie.revision] = ancestors

240

heads[ie.revision] = ie

241

return heads

242

243

def get_tar_item(self, root, dp, now, tree):

244

"""Get a tarfile item and a file stream for its content."""

245

item = tarfile.TarInfo(pathjoin(root, dp))

246

# TODO: would be cool to actually set it to the timestamp of the

247

# revision it was last changed

248

item.mtime = now

249

fileobj = self._put_in_tar(item, tree)

250

return item, fileobj

251

252

def has_text(self):

253

"""Return true if the object this entry represents has textual data.

254

255

Note that textual data includes binary content.

256

257

Also note that all entries get weave files created for them.

258

This attribute is primarily used when upgrading from old trees that

259

did not have the weave index for all inventory entries.

260

"""

261

return False

262

263

def __init__(self, file_id, name, parent_id, text_id=None):

104

def __init__(self, file_id, name, kind, parent_id, text_id=None):

264

105

"""Create an InventoryEntry

265

106

266

107

The filename must be a single component, relative to the

267

108

parent directory; it cannot be a whole path or relative name.

268

109

269

>>> e = InventoryFile('123', 'hello.c', ROOT_ID)

110

>>> e = InventoryEntry('123', 'hello.c', 'file', ROOT_ID)

270

111

>>> e.name

271

112

'hello.c'

272

113

>>> e.file_id

273

114

'123'

274

>>> e = InventoryFile('123', 'src/hello.c', ROOT_ID)

115

>>> e = InventoryEntry('123', 'src/hello.c', 'file', ROOT_ID)

275

116

Traceback (most recent call last):

276

InvalidEntryName: Invalid entry name: src/hello.c

117

BzrCheckError: InventoryEntry name 'src/hello.c' is invalid

277

118

"""

278

assert isinstance(name, basestring), name

279

119

if '/' in name or '\\' in name:

280

raise InvalidEntryName(name=name)

281

self.executable = False

282

self.revision = None

283

self.text_sha1 = None

284

self.text_size = None

120

raise BzrCheckError('InventoryEntry name %r is invalid' % name)

121

285

122

self.file_id = file_id

286

123

self.name = name

124

self.kind = kind

287

125

self.text_id = text_id

288

126

self.parent_id = parent_id

289

self.symlink_target = None

290

291

def kind_character(self):

292

"""Return a short kind indicator useful for appending to names."""

293

raise BzrError('unknown kind %r' % self.kind)

294

295

known_kinds = ('file', 'directory', 'symlink', 'root_directory')

296

297

def _put_in_tar(self, item, tree):

298

"""populate item for stashing in a tar, and return the content stream.

299

300

If no content is available, return None.

301

"""

302

raise BzrError("don't know how to export {%s} of kind %r" %

303

(self.file_id, self.kind))

304

305

def put_on_disk(self, dest, dp, tree):

306

"""Create a representation of self on disk in the prefix dest.

307

308

This is a template method - implement _put_on_disk in subclasses.

309

"""

310

fullpath = pathjoin(dest, dp)

311

self._put_on_disk(fullpath, tree)

312

mutter(" export {%s} kind %s to %s", self.file_id,

313

self.kind, fullpath)

314

315

def _put_on_disk(self, fullpath, tree):

316

"""Put this entry onto disk at fullpath, from tree tree."""

317

raise BzrError("don't know how to export {%s} of kind %r" % (self.file_id, self.kind))

127

if kind == 'directory':

128

self.children = {}

129

elif kind == 'file':

130

pass

131

else:

132

raise BzrError("unhandled entry kind %r" % kind)

133

134

318

135

319

136

def sorted_children(self):

320

return sorted(self.children.items())

321

322

@staticmethod

323

def versionable_kind(kind):

324

return kind in ('file', 'directory', 'symlink')

325

326

def check(self, checker, rev_id, inv, tree):

327

"""Check this inventory entry is intact.

328

329

This is a template method, override _check for kind specific

330

tests.

331

332

:param checker: Check object providing context for the checks;

333

can be used to find out what parts of the repository have already

334

been checked.

335

:param rev_id: Revision id from which this InventoryEntry was loaded.

336

Not necessarily the last-changed revision for this file.

337

:param inv: Inventory from which the entry was loaded.

338

:param tree: RevisionTree for this entry.

339

"""

340

if self.parent_id is not None:

341

if not inv.has_id(self.parent_id):

342

raise BzrCheckError('missing parent {%s} in inventory for revision {%s}'

343

% (self.parent_id, rev_id))

344

self._check(checker, rev_id, tree)

345

346

def _check(self, checker, rev_id, tree):

347

"""Check this inventory entry for kind specific errors."""

348

raise BzrCheckError('unknown entry kind %r in revision {%s}' %

349

(self.kind, rev_id))

137

l = self.children.items()

138

l.sort()

139

return l

140

350

141

351

142

def copy(self):

352

"""Clone this inventory entry."""

353

raise NotImplementedError

354

355

@staticmethod

356

def describe_change(old_entry, new_entry):

357

"""Describe the change between old_entry and this.

358

359

This smells of being an InterInventoryEntry situation, but as it's

360

the first one, we're making it a static method for now.

361

362

An entry with a different parent, or different name is considered

363

to be renamed. Reparenting is an internal detail.

364

Note that renaming the parent does not trigger a rename for the

365

child entry itself.

366

"""

367

# TODO: Perhaps return an object rather than just a string

368

if old_entry is new_entry:

369

# also the case of both being None

370

return 'unchanged'

371

elif old_entry is None:

372

return 'added'

373

elif new_entry is None:

374

return 'removed'

375

text_modified, meta_modified = new_entry.detect_changes(old_entry)

376

if text_modified or meta_modified:

377

modified = True

378

else:

379

modified = False

380

# TODO 20060511 (mbp, rbc) factor out 'detect_rename' here.

381

if old_entry.parent_id != new_entry.parent_id:

382

renamed = True

383

elif old_entry.name != new_entry.name:

384

renamed = True

385

else:

386

renamed = False

387

if renamed and not modified:

388

return InventoryEntry.RENAMED

389

if modified and not renamed:

390

return 'modified'

391

if modified and renamed:

392

return InventoryEntry.MODIFIED_AND_RENAMED

393

return 'unchanged'

143

other = InventoryEntry(self.file_id, self.name, self.kind,

144

self.parent_id, text_id=self.text_id)

145

other.text_sha1 = self.text_sha1

146

other.text_size = self.text_size

147

# note that children are *not* copied; they're pulled across when

148

# others are added

149

return other

150

394

151

395

152

def __repr__(self):

396

return ("%s(%r, %r, parent_id=%r)"

153

return ("%s(%r, %r, kind=%r, parent_id=%r)"

397

154

% (self.__class__.__name__,

398

155

self.file_id,

399

156

self.name,

157

self.kind,

400

158

self.parent_id))

401

159

402

def snapshot(self, revision, path, previous_entries,

403

work_tree, commit_builder):

404

"""Make a snapshot of this entry which may or may not have changed.

405

406

This means that all its fields are populated, that it has its

407

text stored in the text store or weave.

408

"""

409

mutter('new parents of %s are %r', path, previous_entries)

410

self._read_tree_state(path, work_tree)

411

# TODO: Where should we determine whether to reuse a

412

# previous revision id or create a new revision? 20060606

413

if len(previous_entries) == 1:

414

# cannot be unchanged unless there is only one parent file rev.

415

parent_ie = previous_entries.values()[0]

416

if self._unchanged(parent_ie):

417

mutter("found unchanged entry")

418

self.revision = parent_ie.revision

419

return "unchanged"

420

return self._snapshot_into_revision(revision, previous_entries,

421

work_tree, commit_builder)

422

423

def _snapshot_into_revision(self, revision, previous_entries, work_tree,

424

commit_builder):

425

"""Record this revision unconditionally into a store.

426

427

The entry's last-changed revision property (`revision`) is updated to

428

that of the new revision.

429

430

:param revision: id of the new revision that is being recorded.

431

432

:returns: String description of the commit (e.g. "merged", "modified"), etc.

433

"""

434

mutter('new revision {%s} for {%s}', revision, self.file_id)

435

self.revision = revision

436

self._snapshot_text(previous_entries, work_tree, commit_builder)

437

438

def _snapshot_text(self, file_parents, work_tree, commit_builder):

439

"""Record the 'text' of this entry, whatever form that takes.

440

441

This default implementation simply adds an empty text.

442

"""

443

raise NotImplementedError(self._snapshot_text)

160

161

def to_element(self):

162

"""Convert to XML element"""

163

e = Element('entry')

164

165

e.set('name', self.name)

166

e.set('file_id', self.file_id)

167

e.set('kind', self.kind)

168

169

if self.text_size != None:

170

e.set('text_size', '%d' % self.text_size)

171

172

for f in ['text_id', 'text_sha1']:

173

v = getattr(self, f)

174

if v != None:

175

e.set(f, v)

176

177

# to be conservative, we don't externalize the root pointers

178

# for now, leaving them as null in the xml form. in a future

179

# version it will be implied by nested elements.

180

if self.parent_id != ROOT_ID:

181

assert isinstance(self.parent_id, basestring)

182

e.set('parent_id', self.parent_id)

183

184

e.tail = '\n'

185

186

return e

187

188

189

def from_element(cls, elt):

190

assert elt.tag == 'entry'

191

192

## original format inventories don't have a parent_id for

193

## nodes in the root directory, but it's cleaner to use one

194

## internally.

195

parent_id = elt.get('parent_id')

196

if parent_id == None:

197

parent_id = ROOT_ID

198

199

self = cls(elt.get('file_id'), elt.get('name'), elt.get('kind'), parent_id)

200

self.text_id = elt.get('text_id')

201

self.text_sha1 = elt.get('text_sha1')

202

203

## mutter("read inventoryentry: %r" % (elt.attrib))

204

205

v = elt.get('text_size')

206

self.text_size = v and int(v)

207

208

return self

209

210

211

from_element = classmethod(from_element)

444

212

445

213

def __eq__(self, other):

446

214

if not isinstance(other, InventoryEntry):

447

215

return NotImplemented

448

216

449

return ((self.file_id == other.file_id)

450

and (self.name == other.name)

451

and (other.symlink_target == self.symlink_target)

452

and (self.text_sha1 == other.text_sha1)

453

and (self.text_size == other.text_size)

454

and (self.text_id == other.text_id)

455

and (self.parent_id == other.parent_id)

456

and (self.kind == other.kind)

457

and (self.revision == other.revision)

458

and (self.executable == other.executable)

459

)

217

return (self.file_id == other.file_id) \

218

and (self.name == other.name) \

219

and (self.text_sha1 == other.text_sha1) \

220

and (self.text_size == other.text_size) \

221

and (self.text_id == other.text_id) \

222

and (self.parent_id == other.parent_id) \

223

and (self.kind == other.kind)

224

460

225

461

226

def __ne__(self, other):

462

227

return not (self == other)

464

229

def __hash__(self):

465

230

raise ValueError('not hashable')

466

231

467

def _unchanged(self, previous_ie):

468

"""Has this entry changed relative to previous_ie.

469

470

This method should be overridden in child classes.

471

"""

472

compatible = True

473

# different inv parent

474

if previous_ie.parent_id != self.parent_id:

475

compatible = False

476

# renamed

477

elif previous_ie.name != self.name:

478

compatible = False

479

return compatible

480

481

def _read_tree_state(self, path, work_tree):

482

"""Populate fields in the inventory entry from the given tree.

483

484

Note that this should be modified to be a noop on virtual trees

485

as all entries created there are prepopulated.

486

"""

487

# TODO: Rather than running this manually, we should check the

488

# working sha1 and other expensive properties when they're

489

# first requested, or preload them if they're already known

490

pass # nothing to do by default

491

492

def _forget_tree_state(self):

493

pass

494

232

495

233

496

234

class RootEntry(InventoryEntry):

497

498

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

499

'text_id', 'parent_id', 'children', 'executable',

500

'revision', 'symlink_target']

501

502

def _check(self, checker, rev_id, tree):

503

"""See InventoryEntry._check"""

504

505

235

def __init__(self, file_id):

506

236

self.file_id = file_id

507

237

self.children = {}

508

238

self.kind = 'root_directory'

509

239

self.parent_id = None

510

self.name = u''

240

self.name = ''

511

241

512

242

def __eq__(self, other):

513

243

if not isinstance(other, RootEntry):

517

247

and (self.children == other.children)

518

248

519

249

520

class InventoryDirectory(InventoryEntry):

521

"""A directory in an inventory."""

522

523

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

524

'text_id', 'parent_id', 'children', 'executable',

525

'revision', 'symlink_target']

526

527

def _check(self, checker, rev_id, tree):

528

"""See InventoryEntry._check"""

529

if self.text_sha1 is not None or self.text_size is not None or self.text_id is not None:

530

raise BzrCheckError('directory {%s} has text in revision {%s}'

531

% (self.file_id, rev_id))

532

533

def copy(self):

534

other = InventoryDirectory(self.file_id, self.name, self.parent_id)

535

other.revision = self.revision

536

# note that children are *not* copied; they're pulled across when

537

# others are added

538

return other

539

540

def __init__(self, file_id, name, parent_id):

541

super(InventoryDirectory, self).__init__(file_id, name, parent_id)

542

self.children = {}

543

self.kind = 'directory'

544

545

def kind_character(self):

546

"""See InventoryEntry.kind_character."""

547

return '/'

548

549

def _put_in_tar(self, item, tree):

550

"""See InventoryEntry._put_in_tar."""

551

item.type = tarfile.DIRTYPE

552

fileobj = None

553

item.name += '/'

554

item.size = 0

555

item.mode = 0755

556

return fileobj

557

558

def _put_on_disk(self, fullpath, tree):

559

"""See InventoryEntry._put_on_disk."""

560

os.mkdir(fullpath)

561

562

def _snapshot_text(self, file_parents, work_tree, commit_builder):

563

"""See InventoryEntry._snapshot_text."""

564

commit_builder.modified_directory(self.file_id, file_parents)

565

566

567

class InventoryFile(InventoryEntry):

568

"""A file in an inventory."""

569

570

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

571

'text_id', 'parent_id', 'children', 'executable',

572

'revision', 'symlink_target']

573

574

def _check(self, checker, tree_revision_id, tree):

575

"""See InventoryEntry._check"""

576

t = (self.file_id, self.revision)

577

if t in checker.checked_texts:

578

prev_sha = checker.checked_texts[t]

579

if prev_sha != self.text_sha1:

580

raise BzrCheckError('mismatched sha1 on {%s} in {%s}' %

581

(self.file_id, tree_revision_id))

582

else:

583

checker.repeated_text_cnt += 1

584

return

585

586

if self.file_id not in checker.checked_weaves:

587

mutter('check weave {%s}', self.file_id)

588

w = tree.get_weave(self.file_id)

589

# Not passing a progress bar, because it creates a new

590

# progress, which overwrites the current progress,

591

# and doesn't look nice

592

w.check()

593

checker.checked_weaves[self.file_id] = True

594

else:

595

w = tree.get_weave(self.file_id)

596

597

mutter('check version {%s} of {%s}', tree_revision_id, self.file_id)

598

checker.checked_text_cnt += 1

599

# We can't check the length, because Weave doesn't store that

600

# information, and the whole point of looking at the weave's

601

# sha1sum is that we don't have to extract the text.

602

if self.text_sha1 != w.get_sha1(self.revision):

603

raise BzrCheckError('text {%s} version {%s} wrong sha1'

604

% (self.file_id, self.revision))

605

checker.checked_texts[t] = self.text_sha1

606

607

def copy(self):

608

other = InventoryFile(self.file_id, self.name, self.parent_id)

609

other.executable = self.executable

610

other.text_id = self.text_id

611

other.text_sha1 = self.text_sha1

612

other.text_size = self.text_size

613

other.revision = self.revision

614

return other

615

616

def detect_changes(self, old_entry):

617

"""See InventoryEntry.detect_changes."""

618

assert self.text_sha1 is not None

619

assert old_entry.text_sha1 is not None

620

text_modified = (self.text_sha1 != old_entry.text_sha1)

621

meta_modified = (self.executable != old_entry.executable)

622

return text_modified, meta_modified

623

624

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

625

output_to, reverse=False):

626

"""See InventoryEntry._diff."""

627

try:

628

from_text = tree.get_file(self.file_id).readlines()

629

if to_entry:

630

to_text = to_tree.get_file(to_entry.file_id).readlines()

631

else:

632

to_text = []

633

if not reverse:

634

text_diff(from_label, from_text,

635

to_label, to_text, output_to)

636

else:

637

text_diff(to_label, to_text,

638

from_label, from_text, output_to)

639

except BinaryFile:

640

if reverse:

641

label_pair = (to_label, from_label)

642

else:

643

label_pair = (from_label, to_label)

644

print >> output_to, "Binary files %s and %s differ" % label_pair

645

646

def has_text(self):

647

"""See InventoryEntry.has_text."""

648

return True

649

650

def __init__(self, file_id, name, parent_id):

651

super(InventoryFile, self).__init__(file_id, name, parent_id)

652

self.kind = 'file'

653

654

def kind_character(self):

655

"""See InventoryEntry.kind_character."""

656

return ''

657

658

def _put_in_tar(self, item, tree):

659

"""See InventoryEntry._put_in_tar."""

660

item.type = tarfile.REGTYPE

661

fileobj = tree.get_file(self.file_id)

662

item.size = self.text_size

663

if tree.is_executable(self.file_id):

664

item.mode = 0755

665

else:

666

item.mode = 0644

667

return fileobj

668

669

def _put_on_disk(self, fullpath, tree):

670

"""See InventoryEntry._put_on_disk."""

671

pumpfile(tree.get_file(self.file_id), file(fullpath, 'wb'))

672

if tree.is_executable(self.file_id):

673

os.chmod(fullpath, 0755)

674

675

def _read_tree_state(self, path, work_tree):

676

"""See InventoryEntry._read_tree_state."""

677

self.text_sha1 = work_tree.get_file_sha1(self.file_id, path=path)

678

# FIXME: 20050930 probe for the text size when getting sha1

679

# in _read_tree_state

680

self.executable = work_tree.is_executable(self.file_id, path=path)

681

682

def _forget_tree_state(self):

683

self.text_sha1 = None

684

self.executable = None

685

686

def _snapshot_text(self, file_parents, work_tree, commit_builder):

687

"""See InventoryEntry._snapshot_text."""

688

def get_content_byte_lines():

689

return work_tree.get_file(self.file_id).readlines()

690

self.text_sha1, self.text_size = commit_builder.modified_file_text(

691

self.file_id, file_parents, get_content_byte_lines, self.text_sha1, self.text_size)

692

693

def _unchanged(self, previous_ie):

694

"""See InventoryEntry._unchanged."""

695

compatible = super(InventoryFile, self)._unchanged(previous_ie)

696

if self.text_sha1 != previous_ie.text_sha1:

697

compatible = False

698

else:

699

# FIXME: 20050930 probe for the text size when getting sha1

700

# in _read_tree_state

701

self.text_size = previous_ie.text_size

702

if self.executable != previous_ie.executable:

703

compatible = False

704

return compatible

705

706

707

class InventoryLink(InventoryEntry):

708

"""A file in an inventory."""

709

710

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

711

'text_id', 'parent_id', 'children', 'executable',

712

'revision', 'symlink_target']

713

714

def _check(self, checker, rev_id, tree):

715

"""See InventoryEntry._check"""

716

if self.text_sha1 is not None or self.text_size is not None or self.text_id is not None:

717

raise BzrCheckError('symlink {%s} has text in revision {%s}'

718

% (self.file_id, rev_id))

719

if self.symlink_target is None:

720

raise BzrCheckError('symlink {%s} has no target in revision {%s}'

721

% (self.file_id, rev_id))

722

723

def copy(self):

724

other = InventoryLink(self.file_id, self.name, self.parent_id)

725

other.symlink_target = self.symlink_target

726

other.revision = self.revision

727

return other

728

729

def detect_changes(self, old_entry):

730

"""See InventoryEntry.detect_changes."""

731

# FIXME: which _modified field should we use ? RBC 20051003

732

text_modified = (self.symlink_target != old_entry.symlink_target)

733

if text_modified:

734

mutter(" symlink target changed")

735

meta_modified = False

736

return text_modified, meta_modified

737

738

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

739

output_to, reverse=False):

740

"""See InventoryEntry._diff."""

741

from_text = self.symlink_target

742

if to_entry is not None:

743

to_text = to_entry.symlink_target

744

if reverse:

745

temp = from_text

746

from_text = to_text

747

to_text = temp

748

print >>output_to, '=== target changed %r => %r' % (from_text, to_text)

749

else:

750

if not reverse:

751

print >>output_to, '=== target was %r' % self.symlink_target

752

else:

753

print >>output_to, '=== target is %r' % self.symlink_target

754

755

def __init__(self, file_id, name, parent_id):

756

super(InventoryLink, self).__init__(file_id, name, parent_id)

757

self.kind = 'symlink'

758

759

def kind_character(self):

760

"""See InventoryEntry.kind_character."""

761

return ''

762

763

def _put_in_tar(self, item, tree):

764

"""See InventoryEntry._put_in_tar."""

765

item.type = tarfile.SYMTYPE

766

fileobj = None

767

item.size = 0

768

item.mode = 0755

769

item.linkname = self.symlink_target

770

return fileobj

771

772

def _put_on_disk(self, fullpath, tree):

773

"""See InventoryEntry._put_on_disk."""

774

try:

775

os.symlink(self.symlink_target, fullpath)

776

except OSError,e:

777

raise BzrError("Failed to create symlink %r -> %r, error: %s" % (fullpath, self.symlink_target, e))

778

779

def _read_tree_state(self, path, work_tree):

780

"""See InventoryEntry._read_tree_state."""

781

self.symlink_target = work_tree.get_symlink_target(self.file_id)

782

783

def _forget_tree_state(self):

784

self.symlink_target = None

785

786

def _unchanged(self, previous_ie):

787

"""See InventoryEntry._unchanged."""

788

compatible = super(InventoryLink, self)._unchanged(previous_ie)

789

if self.symlink_target != previous_ie.symlink_target:

790

compatible = False

791

return compatible

792

793

def _snapshot_text(self, file_parents, work_tree, commit_builder):

794

"""See InventoryEntry._snapshot_text."""

795

commit_builder.modified_link(

796

self.file_id, file_parents, self.symlink_target)

797

798

799

class Inventory(object):

250

251

class Inventory(XMLMixin):

800

252

"""Inventory of versioned files in a tree.

801

253

802

254

This describes which file_id is present at each point in the tree,

814

266

inserted, other than through the Inventory API.

815

267

816

268

>>> inv = Inventory()

817

>>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))

818

InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT')

269

>>> inv.write_xml(sys.stdout)

270

271

</inventory>

272

>>> inv.add(InventoryEntry('123-123', 'hello.c', 'file', ROOT_ID))

819

273

>>> inv['123-123'].name

820

274

'hello.c'

821

275

829

283

May also look up by name:

830

284

831

285

>>> [x[0] for x in inv.iter_entries()]

832

[u'hello.c']

833

>>> inv = Inventory('TREE_ROOT-12345678-12345678')

834

>>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))

835

InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT-12345678-12345678')

286

['hello.c']

287

288

>>> inv.write_xml(sys.stdout)

289

290

291

</inventory>

292

836

293

"""

837

def __init__(self, root_id=ROOT_ID, revision_id=None):

294

def __init__(self):

838

295

"""Create or read an inventory.

839

296

840

297

If a working directory is specified, the inventory is read

844

301

The inventory is created with a default root directory, with

845

302

an id of None.

846

303

"""

847

# We are letting Branch.create() create a unique inventory

848

# root id. Rather than generating a random one here.

849

#if root_id is None:

850

# root_id = bzrlib.branch.gen_file_id('TREE_ROOT')

851

self.root = RootEntry(root_id)

852

self.revision_id = revision_id

304

self.root = RootEntry(ROOT_ID)

853

305

self._byid = {self.root.file_id: self.root}

854

306

855

def copy(self):

856

# TODO: jam 20051218 Should copy also copy the revision_id?

857

other = Inventory(self.root.file_id)

858

# copy recursively so we know directories will be added before

859

# their children. There are more efficient ways than this...

860

for path, entry in self.iter_entries():

861

if entry == self.root:

862

continue

863

other.add(entry.copy())

864

return other

865

307

866

308

def __iter__(self):

867

309

return iter(self._byid)

868

310

311

869

312

def __len__(self):

870

313

"""Returns number of entries."""

871

314

return len(self._byid)

872

315

316

873

317

def iter_entries(self, from_dir=None):

874

318

"""Return (path, entry) pairs, in order by name."""

875

if from_dir is None:

876

assert self.root

877

from_dir = self.root

878

elif isinstance(from_dir, basestring):

879

from_dir = self._byid[from_dir]

880

881

# unrolling the recursive called changed the time from

882

# 440ms/663ms (inline/total) to 116ms/116ms

883

children = from_dir.children.items()

884

children.sort()

885

children = collections.deque(children)

886

stack = [(u'', children)]

887

while stack:

888

from_dir_relpath, children = stack[-1]

889

890

while children:

891

name, ie = children.popleft()

892

893

# we know that from_dir_relpath never ends in a slash

894

# and 'f' doesn't begin with one, we can do a string op, rather

895

# than the checks of pathjoin(), though this means that all paths

896

# start with a slash

897

path = from_dir_relpath + '/' + name

898

899

yield path[1:], ie

900

901

if ie.kind != 'directory':

902

continue

903

904

# But do this child first

905

new_children = ie.children.items()

906

new_children.sort()

907

new_children = collections.deque(new_children)

908

stack.append((path, new_children))

909

# Break out of inner loop, so that we start outer loop with child

910

break

911

else:

912

# if we finished all children, pop it off the stack

913

stack.pop()

914

915

def iter_entries_by_dir(self, from_dir=None):

916

"""Iterate over the entries in a directory first order.

917

918

This returns all entries for a directory before returning

919

the entries for children of a directory. This is not

920

lexicographically sorted order, and is a hybrid between

921

depth-first and breadth-first.

922

923

:return: This yields (path, entry) pairs

924

"""

925

# TODO? Perhaps this should return the from_dir so that the root is

926

# yielded? or maybe an option?

927

if from_dir is None:

928

assert self.root

929

from_dir = self.root

930

elif isinstance(from_dir, basestring):

931

from_dir = self._byid[from_dir]

932

933

stack = [(u'', from_dir)]

934

while stack:

935

cur_relpath, cur_dir = stack.pop()

936

937

child_dirs = []

938

for child_name, child_ie in sorted(cur_dir.children.iteritems()):

939

940

child_relpath = cur_relpath + child_name

941

942

yield child_relpath, child_ie

943

944

if child_ie.kind == 'directory':

945

child_dirs.append((child_relpath+'/', child_ie))

946

stack.extend(reversed(child_dirs))

319

if from_dir == None:

320

assert self.root

321

from_dir = self.root

322

elif isinstance(from_dir, basestring):

323

from_dir = self._byid[from_dir]

324

325

kids = from_dir.children.items()

326

kids.sort()

327

for name, ie in kids:

328

yield name, ie

329

if ie.kind == 'directory':

330

for cn, cie in self.iter_entries(from_dir=ie.file_id):

331

yield os.path.join(name, cn), cie

332

947

333

948

334

def entries(self):

949

335

"""Return list of (path, ie) for all entries except the root.

955

341

kids = dir_ie.children.items()

956

342

kids.sort()

957

343

for name, ie in kids:

958

child_path = pathjoin(dir_path, name)

344

child_path = os.path.join(dir_path, name)

959

345

accum.append((child_path, ie))

960

346

if ie.kind == 'directory':

961

347

descend(ie, child_path)

962

348

963

descend(self.root, u'')

349

descend(self.root, '')

964

350

return accum

965

351

352

966

353

def directories(self):

967

354

"""Return (path, entry) pairs for all directories, including the root.

968

355

"""

974

361

kids.sort()

975

362

976

363

for name, child_ie in kids:

977

child_path = pathjoin(parent_path, name)

364

child_path = os.path.join(parent_path, name)

978

365

descend(child_ie, child_path)

979

descend(self.root, u'')

366

descend(self.root, '')

980

367

return accum

981

368

369

370

982

371

def __contains__(self, file_id):

983

372

"""True if this entry contains a file with given id.

984

373

985

374

>>> inv = Inventory()

986

>>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))

987

InventoryFile('123', 'foo.c', parent_id='TREE_ROOT')

375

>>> inv.add(InventoryEntry('123', 'foo.c', 'file', ROOT_ID))

988

376

>>> '123' in inv

989

377

True

990

378

>>> '456' in inv

992

380

"""

993

381

return file_id in self._byid

994

382

383

995

384

def __getitem__(self, file_id):

996

385

"""Return the entry for given file_id.

997

386

998

387

>>> inv = Inventory()

999

>>> inv.add(InventoryFile('123123', 'hello.c', ROOT_ID))

1000

InventoryFile('123123', 'hello.c', parent_id='TREE_ROOT')

388

>>> inv.add(InventoryEntry('123123', 'hello.c', 'file', ROOT_ID))

1001

389

>>> inv['123123'].name

1002

390

'hello.c'

1003

391

"""

1004

392

try:

1005

393

return self._byid[file_id]

1006

394

except KeyError:

1007

if file_id is None:

395

if file_id == None:

1008

396

raise BzrError("can't look up file_id None")

1009

397

else:

1010

398

raise BzrError("file_id {%s} not in inventory" % file_id)

1011

399

400

1012

401

def get_file_kind(self, file_id):

1013

402

return self._byid[file_id].kind

1014

403

1015

404

def get_child(self, parent_id, filename):

1016

405

return self[parent_id].children.get(filename)

1017

406

407

1018

408

def add(self, entry):

1019

409

"""Add entry to inventory.

1020

410

1021

411

To add a file to a branch ready to be committed, use Branch.add,

1022

which calls this.

1023

1024

Returns the new entry object.

1025

"""

412

which calls this."""

1026

413

if entry.file_id in self._byid:

1027

414

raise BzrError("inventory already contains entry with id {%s}" % entry.file_id)

1028

415

1029

if entry.parent_id == ROOT_ID or entry.parent_id is None:

1030

entry.parent_id = self.root.file_id

1031

1032

416

try:

1033

417

parent = self._byid[entry.parent_id]

1034

418

except KeyError:

1035

419

raise BzrError("parent_id {%s} not in inventory" % entry.parent_id)

1036

420

1037

if entry.name in parent.children:

421

if parent.children.has_key(entry.name):

1038

422

raise BzrError("%s is already versioned" %

1039

pathjoin(self.id2path(parent.file_id), entry.name))

423

appendpath(self.id2path(parent.file_id), entry.name))

1040

424

1041

425

self._byid[entry.file_id] = entry

1042

426

parent.children[entry.name] = entry

1043

return entry

1044

1045

def add_path(self, relpath, kind, file_id=None, parent_id=None):

427

428

429

def add_path(self, relpath, kind, file_id=None):

1046

430

"""Add entry from a path.

1047

431

1048

The immediate parent must already be versioned.

1049

1050

Returns the new entry object."""

1051

432

The immediate parent must already be versioned"""

1052

433

parts = bzrlib.osutils.splitpath(relpath)

1053

1054

434

if len(parts) == 0:

1055

if file_id is None:

1056

file_id = bzrlib.workingtree.gen_root_id()

1057

self.root = RootEntry(file_id)

1058

self._byid = {self.root.file_id: self.root}

1059

return

1060

else:

1061

parent_path = parts[:-1]

1062

parent_id = self.path2id(parent_path)

1063

if parent_id is None:

1064

raise NotVersionedError(path=parent_path)

1065

ie = make_entry(kind, parts[-1], parent_id, file_id)

435

raise BzrError("cannot re-add root of inventory")

436

437

if file_id == None:

438

file_id = bzrlib.branch.gen_file_id(relpath)

439

440

parent_id = self.path2id(parts[:-1])

441

assert parent_id != None

442

ie = InventoryEntry(file_id, parts[-1],

443

kind=kind, parent_id=parent_id)

1066

444

return self.add(ie)

1067

445

446

1068

447

def __delitem__(self, file_id):

1069

448

"""Remove entry by id.

1070

449

1071

450

>>> inv = Inventory()

1072

>>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))

1073

InventoryFile('123', 'foo.c', parent_id='TREE_ROOT')

451

>>> inv.add(InventoryEntry('123', 'foo.c', 'file', ROOT_ID))

1074

452

>>> '123' in inv

1075

453

True

1076

454

>>> del inv['123']

1079

457

"""

1080

458

ie = self[file_id]

1081

459

1082

assert ie.parent_id is None or \

1083

self[ie.parent_id].children[ie.name] == ie

460

assert self[ie.parent_id].children[ie.name] == ie

1084

461

462

# TODO: Test deleting all children; maybe hoist to a separate

463

# deltree method?

464

if ie.kind == 'directory':

465

for cie in ie.children.values():

466

del self[cie.file_id]

467

del ie.children

468

1085

469

del self._byid[file_id]

1086

if ie.parent_id is not None:

1087

del self[ie.parent_id].children[ie.name]

470

del self[ie.parent_id].children[ie.name]

471

472

473

def to_element(self):

474

"""Convert to XML Element"""

475

e = Element('inventory')

476

e.text = '\n'

477

for path, ie in self.iter_entries():

478

e.append(ie.to_element())

479

return e

480

481

482

def from_element(cls, elt):

483

"""Construct from XML Element

484

485

>>> inv = Inventory()

486

>>> inv.add(InventoryEntry('foo.c-123981239', 'foo.c', 'file', ROOT_ID))

487

>>> elt = inv.to_element()

488

>>> inv2 = Inventory.from_element(elt)

489

>>> inv2 == inv

490

True

491

"""

492

assert elt.tag == 'inventory'

493

o = cls()

494

for e in elt:

495

o.add(InventoryEntry.from_element(e))

496

return o

497

498

from_element = classmethod(from_element)

499

1088

500

1089

501

def __eq__(self, other):

1090

502

"""Compare two sets by comparing their contents.

1093

505

>>> i2 = Inventory()

1094

506

>>> i1 == i2

1095

507

True

1096

>>> i1.add(InventoryFile('123', 'foo', ROOT_ID))

1097

InventoryFile('123', 'foo', parent_id='TREE_ROOT')

508

>>> i1.add(InventoryEntry('123', 'foo', 'file', ROOT_ID))

1098

509

>>> i1 == i2

1099

510

False

1100

>>> i2.add(InventoryFile('123', 'foo', ROOT_ID))

1101

InventoryFile('123', 'foo', parent_id='TREE_ROOT')

511

>>> i2.add(InventoryEntry('123', 'foo', 'file', ROOT_ID))

1102

512

>>> i1 == i2

1103

513

True

1104

514

"""

1111

521

1112

522

return self._byid == other._byid

1113

523

524

1114

525

def __ne__(self, other):

1115

return not self.__eq__(other)

526

return not (self == other)

527

1116

528

1117

529

def __hash__(self):

1118

530

raise ValueError('not hashable')

1119

531

1120

def _iter_file_id_parents(self, file_id):

1121

"""Yield the parents of file_id up to the root."""

1122

while file_id is not None:

1123

try:

1124

ie = self._byid[file_id]

1125

except KeyError:

1126

raise BzrError("file_id {%s} not found in inventory" % file_id)

1127

yield ie

1128

file_id = ie.parent_id

532

1129

533

1130

534

def get_idpath(self, file_id):

1131

535

"""Return a list of file_ids for the path to an entry.

1136

540

root directory as depth 1.

1137

541

"""

1138

542

p = []

1139

for parent in self._iter_file_id_parents(file_id):

1140

p.insert(0, parent.file_id)

543

while file_id != None:

544

try:

545

ie = self._byid[file_id]

546

except KeyError:

547

raise BzrError("file_id {%s} not found in inventory" % file_id)

548

p.insert(0, ie.file_id)

549

file_id = ie.parent_id

1141

550

return p

1142

551

552

1143

553

def id2path(self, file_id):

1144

"""Return as a string the path to file_id.

1145

1146

>>> i = Inventory()

1147

>>> e = i.add(InventoryDirectory('src-id', 'src', ROOT_ID))

1148

>>> e = i.add(InventoryFile('foo-id', 'foo.c', parent_id='src-id'))

1149

>>> print i.id2path('foo-id')

1150

src/foo.c

1151

"""

554

"""Return as a list the path to file_id."""

555

1152

556

# get all names, skipping root

1153

return '/'.join(reversed(

1154

[parent.name for parent in

1155

self._iter_file_id_parents(file_id)][:-1]))

557

p = [self[fid].name for fid in self.get_idpath(file_id)[1:]]

558

return os.sep.join(p)

1156

559

560

561

1157

562

def path2id(self, name):

1158

563

"""Walk down through directories to return entry of last component.

1159

564

1163

568

This returns the entry of the last component in the path,

1164

569

which may be either a file or a directory.

1165

570

1166

Returns None IFF the path is not found.

571

Returns None iff the path is not found.

1167

572

"""

1168

573

if isinstance(name, types.StringTypes):

1169

574

name = splitpath(name)

1170

575

1171

# mutter("lookup path %r" % name)

576

mutter("lookup path %r" % name)

1172

577

1173

578

parent = self.root

1174

579

for f in name:

1183

588

1184

589

return parent.file_id

1185

590

591

1186

592

def has_filename(self, names):

1187

593

return bool(self.path2id(names))

1188

594

595

1189

596

def has_id(self, file_id):

1190

597

return self._byid.has_key(file_id)

1191

598

599

1192

600

def rename(self, file_id, new_parent_id, new_name):

1193

601

"""Move a file within the inventory.

1194

602

1219

627

file_ie.parent_id = new_parent_id

1220

628

1221

629

1222

def make_entry(kind, name, parent_id, file_id=None):

1223

"""Create an inventory entry.

1224

1225

:param kind: the type of inventory entry to create.

1226

:param name: the basename of the entry.

1227

:param parent_id: the parent_id of the entry.

1228

:param file_id: the file_id to use. if None, one will be created.

1229

"""

1230

if file_id is None:

1231

file_id = bzrlib.workingtree.gen_file_id(name)

1232

if kind == 'directory':

1233

return InventoryDirectory(file_id, name, parent_id)

1234

elif kind == 'file':

1235

return InventoryFile(file_id, name, parent_id)

1236

elif kind == 'symlink':

1237

return InventoryLink(file_id, name, parent_id)

1238

else:

1239

raise BzrError("unknown kind %r" % kind)

1240

1241

1242

1243

_NAME_RE = None

630

631

632

_NAME_RE = re.compile(r'^[^/\\]+$')

1244

633

1245

634

def is_valid_name(name):

1246

global _NAME_RE

1247

if _NAME_RE is None:

1248

_NAME_RE = re.compile(r'^[^/\\]+$')

1249

1250

635

return bool(_NAME_RE.match(name))

Older »