~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/inventory.py

Committer: John Arbash Meinel
Date: 2006-06-11 03:09:28 UTC
mto: (1711.7.2 win32)
mto: This revision was merged to the branch mainline in revision 1796.
Revision ID: john@arbash-meinel.com-20060611030928-502d4af47bd62fe1

Remove cp437 from the set of encodings, it isn't strictly needed

files added:
BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS.developers

bzrlib/annotate.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/read_bundle.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v07.py

bzrlib/bzrdir.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/identitymap.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lsprof.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/store

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/versionedfile.py

bzrlib/weave_commands.py

bzrlib/win32console.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/emacs

contrib/emacs/bzr-mode.el

doc/README.1st

doc/configuration.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

foo bar

generate_docs.py

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

files removed:
bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/upgrade.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/new-inventory-sample.xml

notes/performance.txt

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

plugins/changeset

plugins/changeset/__init__.py

plugins/changeset/apply_changeset.py

plugins/changeset/common.py

plugins/changeset/gen_changeset.py

plugins/changeset/read_changeset.py

plugins/checkperms

testbzr

testsweet.py

files renamed:
bzrlib/changeset.py => bzrlib/bundle/__init__.py

plugins/ => bzrlib/plugins/

bzrlib/store.py => bzrlib/store/__init__.py

bzrlib/selftest/ => bzrlib/tests/

bzrlib/selftest/teststatus.py => bzrlib/tests/blackbox/test_status.py

bzrlib/selftest/blackbox.py => bzrlib/tests/blackbox/test_too_much.py

bzrlib/selftest/versioning.py => bzrlib/tests/blackbox/test_versioning.py

bzrlib/selftest/testbranch.py => bzrlib/tests/branch_implementations/test_branch.py

bzrlib/selftest/testhashcache.py => bzrlib/tests/test_hashcache.py

bzrlib/selftest/testinv.py => bzrlib/tests/test_inv.py

bzrlib/selftest/testmerge3.py => bzrlib/tests/test_merge3.py

bzrlib/selftest/plugins.py => bzrlib/tests/test_plugins.py

bzrlib/selftest/testrevisionnamespaces.py => bzrlib/tests/test_revisionnamespaces.py

tools/testweave.py => bzrlib/tests/test_weave.py

bzrlib/selftest/whitebox.py => bzrlib/tests/test_whitebox.py

effbot/ => bzrlib/util/effbot/

elementtree/ => bzrlib/util/elementtree/

urlgrabber/ => bzrlib/util/urlgrabber/

bzrlib/xml.py => bzrlib/xml_serializer.py

bzrlib/newinventory.py => contrib/newinventory.py

bzr-man.py => tools/doc_generate/autodoc_man.py

files modified:
.bzrignore

.rsyncexclude

NEWS

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/status.py

bzrlib/tests/__init__.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

contrib/pwk

contrib/zsh/_bzr

setup.py *

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/inventory.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# FIXME: This refactoring of the workingtree code doesn't seem to keep

# the WorkingTree's copy of the inventory in sync with the branch. The

# branch modifies its working inventory when it does a commit to make

# missing files permanently removed.

# TODO: Maybe also keep the full path of the entry, and the children?

# But those depend on its position within a particular inventory, and

# it would be nice not to need to hold the backpointer here.

# This should really be an id randomly assigned when the tree is

# created, but it's not for now.

ROOT_ID = "TREE_ROOT"

import sys, os.path, types, re

import collections

import os.path

import re

import sys

import tarfile

import types

import bzrlib

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.osutils import uuid, quotefn, splitpath, joinpath, appendpath

from bzrlib.osutils import (pumpfile, quotefn, splitpath, joinpath,

pathjoin, sha_strings)

from bzrlib.errors import (NotVersionedError, InvalidEntryName,

BzrError, BzrCheckError, BinaryFile)

from bzrlib.trace import mutter

class InventoryEntry(object):

"""Description of a versioned file.

An InventoryEntry has the following fields, which are also

present in the XML inventory-entry element:

* *file_id*

* *name*: (only the basename within the directory, must not

contain slashes)

* *kind*: "directory" or "file"

* *directory_id*: (if absent/null means the branch root directory)

* *text_sha1*: only for files

* *text_size*: in bytes, only for files

* *text_id*: identifier for the text version, only for files

InventoryEntries can also exist inside a WorkingTree

inventory, in which case they are not yet bound to a

particular revision of the file. In that case the text_sha1,

text_size and text_id are absent.

file_id

name

(within the parent directory)

parent_id

file_id of the parent directory, or ROOT_ID

revision

the revision_id in which this variation of this file was

introduced.

executable

Indicates that this file should be executable on systems

that support it.

text_sha1

sha-1 of the text of the file

text_size

size in bytes of the text of the file

(reading a version 4 tree created a text_id field.)

>>> i = Inventory()

>>> i.path2id('')

'TREE_ROOT'

>>> i.add(InventoryEntry('123', 'src', 'directory', ROOT_ID))

>>> i.add(InventoryEntry('2323', 'hello.c', 'file', parent_id='123'))

>>> for j in i.iter_entries():

... print j

>>> i.add(InventoryDirectory('123', 'src', ROOT_ID))

InventoryDirectory('123', 'src', parent_id='TREE_ROOT')

>>> i.add(InventoryFile('2323', 'hello.c', parent_id='123'))

InventoryFile('2323', 'hello.c', parent_id='123')

>>> shouldbe = {0: 'src', 1: pathjoin('src','hello.c')}

>>> for ix, j in enumerate(i.iter_entries()):

... print (j[0] == shouldbe[ix], j[1])

...

('src', InventoryEntry('123', 'src', kind='directory', parent_id='TREE_ROOT'))

('src/hello.c', InventoryEntry('2323', 'hello.c', kind='file', parent_id='123'))

>>> i.add(InventoryEntry('2323', 'bye.c', 'file', '123'))

(True, InventoryDirectory('123', 'src', parent_id='TREE_ROOT'))

(True, InventoryFile('2323', 'hello.c', parent_id='123'))

>>> i.add(InventoryFile('2323', 'bye.c', '123'))

Traceback (most recent call last):

...

BzrError: inventory already contains entry with id {2323}

>>> i.add(InventoryEntry('2324', 'bye.c', 'file', '123'))

>>> i.add(InventoryEntry('2325', 'wibble', 'directory', '123'))

>>> i.add(InventoryFile('2324', 'bye.c', '123'))

InventoryFile('2324', 'bye.c', parent_id='123')

>>> i.add(InventoryDirectory('2325', 'wibble', '123'))

InventoryDirectory('2325', 'wibble', parent_id='123')

>>> i.path2id('src/wibble')

'2325'

>>> '2325' in i

100

True

>>> i.add(InventoryEntry('2326', 'wibble.c', 'file', '2325'))

101

>>> i.add(InventoryFile('2326', 'wibble.c', '2325'))

102

InventoryFile('2326', 'wibble.c', parent_id='2325')

103

>>> i['2326']

InventoryEntry('2326', 'wibble.c', kind='file', parent_id='2325')

>>> for j in i.iter_entries():

... print j[0]

... assert i.path2id(j[0])

104

InventoryFile('2326', 'wibble.c', parent_id='2325')

105

>>> for path, entry in i.iter_entries():

106

... print path

107

... assert i.path2id(path)

108

...

109

src

110

src/bye.c

113

src/wibble/wibble.c

114

>>> i.id2path('2326')

115

'src/wibble/wibble.c'

TODO: Maybe also keep the full path of the entry, and the children?

But those depend on its position within a particular inventory, and

it would be nice not to need to hold the backpointer here.

116

"""

117

# TODO: split InventoryEntry into subclasses for files,

# directories, etc etc.

118

# Constants returned by describe_change()

119

120

# TODO: These should probably move to some kind of FileChangeDescription

121

# class; that's like what's inside a TreeDelta but we want to be able to

122

# generate them just for one file at a time.

123

RENAMED = 'renamed'

124

MODIFIED_AND_RENAMED = 'modified and renamed'

125

126

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

'text_id', 'parent_id', 'children', ]

def __init__(self, file_id, name, kind, parent_id, text_id=None):

127

'text_id', 'parent_id', 'children', 'executable',

128

'revision']

129

130

def detect_changes(self, old_entry):

131

"""Return a (text_modified, meta_modified) from this to old_entry.

132

133

_read_tree_state must have been called on self and old_entry prior to

134

calling detect_changes.

135

"""

136

return False, False

137

138

def diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

139

output_to, reverse=False):

140

"""Perform a diff from this to to_entry.

141

142

text_diff will be used for textual difference calculation.

143

This is a template method, override _diff in child classes.

144

"""

145

self._read_tree_state(tree.id2path(self.file_id), tree)

146

if to_entry:

147

# cannot diff from one kind to another - you must do a removal

148

# and an add if they do not match.

149

assert self.kind == to_entry.kind

150

to_entry._read_tree_state(to_tree.id2path(to_entry.file_id),

151

to_tree)

152

self._diff(text_diff, from_label, tree, to_label, to_entry, to_tree,

153

output_to, reverse)

154

155

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

156

output_to, reverse=False):

157

"""Perform a diff between two entries of the same kind."""

158

159

def find_previous_heads(self, previous_inventories,

160

versioned_file_store,

161

transaction,

162

entry_vf=None):

163

"""Return the revisions and entries that directly precede this.

164

165

Returned as a map from revision to inventory entry.

166

167

This is a map containing the file revisions in all parents

168

for which the file exists, and its revision is not a parent of

169

any other. If the file is new, the set will be empty.

170

171

:param versioned_file_store: A store where ancestry data on this

172

file id can be queried.

173

:param transaction: The transaction that queries to the versioned

174

file store should be completed under.

175

:param entry_vf: The entry versioned file, if it's already available.

176

"""

177

def get_ancestors(weave, entry):

178

return set(weave.get_ancestry(entry.revision))

179

# revision:ie mapping for each ie found in previous_inventories.

180

candidates = {}

181

# revision:ie mapping with one revision for each head.

182

heads = {}

183

# revision: ancestor list for each head

184

head_ancestors = {}

185

# identify candidate head revision ids.

186

for inv in previous_inventories:

187

if self.file_id in inv:

188

ie = inv[self.file_id]

189

assert ie.file_id == self.file_id

190

if ie.revision in candidates:

191

# same revision value in two different inventories:

192

# correct possible inconsistencies:

193

# * there was a bug in revision updates with 'x' bit

194

# support.

195

try:

196

if candidates[ie.revision].executable != ie.executable:

197

candidates[ie.revision].executable = False

198

ie.executable = False

199

except AttributeError:

200

pass

201

# must now be the same.

202

assert candidates[ie.revision] == ie

203

else:

204

# add this revision as a candidate.

205

candidates[ie.revision] = ie

206

207

# common case optimisation

208

if len(candidates) == 1:

209

# if there is only one candidate revision found

210

# then we can avoid opening the versioned file to access ancestry:

211

# there cannot be any ancestors to eliminate when there is

212

# only one revision available.

213

heads[ie.revision] = ie

214

return heads

215

216

# eliminate ancestors amongst the available candidates:

217

# heads are those that are not an ancestor of any other candidate

218

# - this provides convergence at a per-file level.

219

for ie in candidates.values():

220

# may be an ancestor of a known head:

221

already_present = 0 != len(

222

[head for head in heads

223

if ie.revision in head_ancestors[head]])

224

if already_present:

225

# an ancestor of an analyzed candidate.

226

continue

227

# not an ancestor of a known head:

228

# load the versioned file for this file id if needed

229

if entry_vf is None:

230

entry_vf = versioned_file_store.get_weave_or_empty(

231

self.file_id, transaction)

232

ancestors = get_ancestors(entry_vf, ie)

233

# may knock something else out:

234

check_heads = list(heads.keys())

235

for head in check_heads:

236

if head in ancestors:

237

# this previously discovered 'head' is not

238

# really a head - it's an ancestor of the newly

239

# found head,

240

heads.pop(head)

241

head_ancestors[ie.revision] = ancestors

242

heads[ie.revision] = ie

243

return heads

244

245

def get_tar_item(self, root, dp, now, tree):

246

"""Get a tarfile item and a file stream for its content."""

247

item = tarfile.TarInfo(pathjoin(root, dp))

248

# TODO: would be cool to actually set it to the timestamp of the

249

# revision it was last changed

250

item.mtime = now

251

fileobj = self._put_in_tar(item, tree)

252

return item, fileobj

253

254

def has_text(self):

255

"""Return true if the object this entry represents has textual data.

256

257

Note that textual data includes binary content.

258

259

Also note that all entries get weave files created for them.

260

This attribute is primarily used when upgrading from old trees that

261

did not have the weave index for all inventory entries.

262

"""

263

return False

264

265

def __init__(self, file_id, name, parent_id, text_id=None):

266

"""Create an InventoryEntry

100

267

101

268

The filename must be a single component, relative to the

102

269

parent directory; it cannot be a whole path or relative name.

103

270

104

>>> e = InventoryEntry('123', 'hello.c', 'file', ROOT_ID)

271

>>> e = InventoryFile('123', 'hello.c', ROOT_ID)

105

272

>>> e.name

106

273

'hello.c'

107

274

>>> e.file_id

108

275

'123'

109

>>> e = InventoryEntry('123', 'src/hello.c', 'file', ROOT_ID)

276

>>> e = InventoryFile('123', 'src/hello.c', ROOT_ID)

110

277

Traceback (most recent call last):

111

BzrCheckError: InventoryEntry name 'src/hello.c' is invalid

278

InvalidEntryName: Invalid entry name: src/hello.c

112

279

"""

280

assert isinstance(name, basestring), name

113

281

if '/' in name or '\\' in name:

114

raise BzrCheckError('InventoryEntry name %r is invalid' % name)

115

282

raise InvalidEntryName(name=name)

283

self.executable = False

284

self.revision = None

116

285

self.text_sha1 = None

117

286

self.text_size = None

118

119

287

self.file_id = file_id

120

288

self.name = name

121

self.kind = kind

122

289

self.text_id = text_id

123

290

self.parent_id = parent_id

124

if kind == 'directory':

125

self.children = {}

126

elif kind == 'file':

127

pass

128

else:

129

raise BzrError("unhandled entry kind %r" % kind)

130

131

291

self.symlink_target = None

292

293

def kind_character(self):

294

"""Return a short kind indicator useful for appending to names."""

295

raise BzrError('unknown kind %r' % self.kind)

296

297

known_kinds = ('file', 'directory', 'symlink', 'root_directory')

298

299

def _put_in_tar(self, item, tree):

300

"""populate item for stashing in a tar, and return the content stream.

301

302

If no content is available, return None.

303

"""

304

raise BzrError("don't know how to export {%s} of kind %r" %

305

(self.file_id, self.kind))

306

307

def put_on_disk(self, dest, dp, tree):

308

"""Create a representation of self on disk in the prefix dest.

309

310

This is a template method - implement _put_on_disk in subclasses.

311

"""

312

fullpath = pathjoin(dest, dp)

313

self._put_on_disk(fullpath, tree)

314

mutter(" export {%s} kind %s to %s", self.file_id,

315

self.kind, fullpath)

316

317

def _put_on_disk(self, fullpath, tree):

318

"""Put this entry onto disk at fullpath, from tree tree."""

319

raise BzrError("don't know how to export {%s} of kind %r" % (self.file_id, self.kind))

132

320

133

321

def sorted_children(self):

134

322

l = self.children.items()

135

323

l.sort()

136

324

return l

137

325

326

@staticmethod

327

def versionable_kind(kind):

328

return kind in ('file', 'directory', 'symlink')

329

330

def check(self, checker, rev_id, inv, tree):

331

"""Check this inventory entry is intact.

332

333

This is a template method, override _check for kind specific

334

tests.

335

336

:param checker: Check object providing context for the checks;

337

can be used to find out what parts of the repository have already

338

been checked.

339

:param rev_id: Revision id from which this InventoryEntry was loaded.

340

Not necessarily the last-changed revision for this file.

341

:param inv: Inventory from which the entry was loaded.

342

:param tree: RevisionTree for this entry.

343

"""

344

if self.parent_id != None:

345

if not inv.has_id(self.parent_id):

346

raise BzrCheckError('missing parent {%s} in inventory for revision {%s}'

347

% (self.parent_id, rev_id))

348

self._check(checker, rev_id, tree)

349

350

def _check(self, checker, rev_id, tree):

351

"""Check this inventory entry for kind specific errors."""

352

raise BzrCheckError('unknown entry kind %r in revision {%s}' %

353

(self.kind, rev_id))

138

354

139

355

def copy(self):

140

other = InventoryEntry(self.file_id, self.name, self.kind,

141

self.parent_id, text_id=self.text_id)

142

other.text_sha1 = self.text_sha1

143

other.text_size = self.text_size

144

# note that children are *not* copied; they're pulled across when

145

# others are added

146

return other

147

356

"""Clone this inventory entry."""

357

raise NotImplementedError

358

359

@staticmethod

360

def describe_change(old_entry, new_entry):

361

"""Describe the change between old_entry and new_entry.

362

363

This smells of being an InterInventoryEntry situation, but as it's

364

the first one, we're making it a static method for now.

365

366

An entry with a different parent, or different name is considered

367

to be renamed. Reparenting is an internal detail.

368

Note that renaming the parent does not trigger a rename for the

369

child entry itself.

370

"""

371

# TODO: Perhaps return an object rather than just a string

372

if old_entry is new_entry:

373

# also the case of both being None

374

return 'unchanged'

375

elif old_entry is None:

376

return 'added'

377

elif new_entry is None:

378

return 'removed'

379

text_modified, meta_modified = new_entry.detect_changes(old_entry)

380

if text_modified or meta_modified:

381

modified = True

382

else:

383

modified = False

384

# TODO 20060511 (mbp, rbc) factor out 'detect_rename' here.

385

if old_entry.parent_id != new_entry.parent_id:

386

renamed = True

387

elif old_entry.name != new_entry.name:

388

renamed = True

389

else:

390

renamed = False

391

if renamed and not modified:

392

return InventoryEntry.RENAMED

393

if modified and not renamed:

394

return 'modified'

395

if modified and renamed:

396

return InventoryEntry.MODIFIED_AND_RENAMED

397

return 'unchanged'

148

398

149

399

def __repr__(self):

150

return ("%s(%r, %r, kind=%r, parent_id=%r)"

400

return ("%s(%r, %r, parent_id=%r)"

151

401

% (self.__class__.__name__,

152

402

self.file_id,

153

403

self.name,

154

self.kind,

155

404

self.parent_id))

156

405

157

158

def to_element(self):

159

"""Convert to XML element"""

160

from bzrlib.xml import Element

161

162

e = Element('entry')

163

164

e.set('name', self.name)

165

e.set('file_id', self.file_id)

166

e.set('kind', self.kind)

167

168

if self.text_size != None:

169

e.set('text_size', '%d' % self.text_size)

170

171

for f in ['text_id', 'text_sha1']:

172

v = getattr(self, f)

173

if v != None:

174

e.set(f, v)

175

176

# to be conservative, we don't externalize the root pointers

177

# for now, leaving them as null in the xml form. in a future

178

# version it will be implied by nested elements.

179

if self.parent_id != ROOT_ID:

180

assert isinstance(self.parent_id, basestring)

181

e.set('parent_id', self.parent_id)

182

183

e.tail = '\n'

184

185

return e

186

187

188

def from_element(cls, elt):

189

assert elt.tag == 'entry'

190

191

## original format inventories don't have a parent_id for

192

## nodes in the root directory, but it's cleaner to use one

193

## internally.

194

parent_id = elt.get('parent_id')

195

if parent_id == None:

196

parent_id = ROOT_ID

197

198

self = cls(elt.get('file_id'), elt.get('name'), elt.get('kind'), parent_id)

199

self.text_id = elt.get('text_id')

200

self.text_sha1 = elt.get('text_sha1')

201

202

## mutter("read inventoryentry: %r" % (elt.attrib))

203

204

v = elt.get('text_size')

205

self.text_size = v and int(v)

206

207

return self

208

209

210

from_element = classmethod(from_element)

406

def snapshot(self, revision, path, previous_entries,

407

work_tree, commit_builder):

408

"""Make a snapshot of this entry which may or may not have changed.

409

410

This means that all its fields are populated, that it has its

411

text stored in the text store or weave.

412

"""

413

mutter('new parents of %s are %r', path, previous_entries)

414

self._read_tree_state(path, work_tree)

415

# TODO: Where should we determine whether to reuse a

416

# previous revision id or create a new revision? 20060606

417

if len(previous_entries) == 1:

418

# cannot be unchanged unless there is only one parent file rev.

419

parent_ie = previous_entries.values()[0]

420

if self._unchanged(parent_ie):

421

mutter("found unchanged entry")

422

self.revision = parent_ie.revision

423

return "unchanged"

424

return self._snapshot_into_revision(revision, previous_entries,

425

work_tree, commit_builder)

426

427

def _snapshot_into_revision(self, revision, previous_entries, work_tree,

428

commit_builder):

429

"""Record this revision unconditionally into a store.

430

431

The entry's last-changed revision property (`revision`) is updated to

432

that of the new revision.

433

434

:param revision: id of the new revision that is being recorded.

435

436

:returns: String description of the commit (e.g. "merged", "modified"), etc.

437

"""

438

mutter('new revision {%s} for {%s}', revision, self.file_id)

439

self.revision = revision

440

self._snapshot_text(previous_entries, work_tree, commit_builder)

441

442

def _snapshot_text(self, file_parents, work_tree, commit_builder):

443

"""Record the 'text' of this entry, whatever form that takes.

444

445

This default implementation raises NotImplementedError; subclasses must override it.

446

"""

447

raise NotImplementedError(self._snapshot_text)

211

448

212

449

def __eq__(self, other):

213

450

if not isinstance(other, InventoryEntry):

214

451

return NotImplemented

215

452

216

return (self.file_id == other.file_id) \

217

and (self.name == other.name) \

218

and (self.text_sha1 == other.text_sha1) \

219

and (self.text_size == other.text_size) \

220

and (self.text_id == other.text_id) \

221

and (self.parent_id == other.parent_id) \

222

and (self.kind == other.kind)

223

453

return ((self.file_id == other.file_id)

454

and (self.name == other.name)

455

and (other.symlink_target == self.symlink_target)

456

and (self.text_sha1 == other.text_sha1)

457

and (self.text_size == other.text_size)

458

and (self.text_id == other.text_id)

459

and (self.parent_id == other.parent_id)

460

and (self.kind == other.kind)

461

and (self.revision == other.revision)

462

and (self.executable == other.executable)

463

)

224

464

225

465

def __ne__(self, other):

226

466

return not (self == other)

228

468

def __hash__(self):

229

469

raise ValueError('not hashable')

230

470

471

def _unchanged(self, previous_ie):

472

"""Return True if this entry is unchanged relative to previous_ie.

473

474

This method should be overridden in child classes.

475

"""

476

compatible = True

477

# different inv parent

478

if previous_ie.parent_id != self.parent_id:

479

compatible = False

480

# renamed

481

elif previous_ie.name != self.name:

482

compatible = False

483

return compatible

484

485

def _read_tree_state(self, path, work_tree):

486

"""Populate fields in the inventory entry from the given tree.

487

488

Note that this should be modified to be a noop on virtual trees

489

as all entries created there are prepopulated.

490

"""

491

# TODO: Rather than running this manually, we should check the

492

# working sha1 and other expensive properties when they're

493

# first requested, or preload them if they're already known

494

pass # nothing to do by default

495

496

def _forget_tree_state(self):

497

pass

231

498

232

499

233

500

class RootEntry(InventoryEntry):

501

502

def _check(self, checker, rev_id, tree):

503

"""See InventoryEntry._check"""

504

234

505

def __init__(self, file_id):

235

506

self.file_id = file_id

236

507

self.children = {}

237

508

self.kind = 'root_directory'

238

509

self.parent_id = None

239

self.name = ''

510

self.name = u''

240

511

241

512

def __eq__(self, other):

242

513

if not isinstance(other, RootEntry):

246

517

and (self.children == other.children)

247

518

248

519

520

class InventoryDirectory(InventoryEntry):

521

"""A directory in an inventory."""

522

523

def _check(self, checker, rev_id, tree):

524

"""See InventoryEntry._check"""

525

if self.text_sha1 != None or self.text_size != None or self.text_id != None:

526

raise BzrCheckError('directory {%s} has text in revision {%s}'

527

% (self.file_id, rev_id))

528

529

def copy(self):

530

other = InventoryDirectory(self.file_id, self.name, self.parent_id)

531

other.revision = self.revision

532

# note that children are *not* copied; they're pulled across when

533

# others are added

534

return other

535

536

def __init__(self, file_id, name, parent_id):

537

super(InventoryDirectory, self).__init__(file_id, name, parent_id)

538

self.children = {}

539

self.kind = 'directory'

540

541

def kind_character(self):

542

"""See InventoryEntry.kind_character."""

543

return '/'

544

545

def _put_in_tar(self, item, tree):

546

"""See InventoryEntry._put_in_tar."""

547

item.type = tarfile.DIRTYPE

548

fileobj = None

549

item.name += '/'

550

item.size = 0

551

item.mode = 0755

552

return fileobj

553

554

def _put_on_disk(self, fullpath, tree):

555

"""See InventoryEntry._put_on_disk."""

556

os.mkdir(fullpath)

557

558

def _snapshot_text(self, file_parents, work_tree, commit_builder):

559

"""See InventoryEntry._snapshot_text."""

560

commit_builder.modified_directory(self.file_id, file_parents)

561

562

563

class InventoryFile(InventoryEntry):

564

"""A file in an inventory."""

565

566

def _check(self, checker, tree_revision_id, tree):

567

"""See InventoryEntry._check"""

568

t = (self.file_id, self.revision)

569

if t in checker.checked_texts:

570

prev_sha = checker.checked_texts[t]

571

if prev_sha != self.text_sha1:

572

raise BzrCheckError('mismatched sha1 on {%s} in {%s}' %

573

(self.file_id, tree_revision_id))

574

else:

575

checker.repeated_text_cnt += 1

576

return

577

578

if self.file_id not in checker.checked_weaves:

579

mutter('check weave {%s}', self.file_id)

580

w = tree.get_weave(self.file_id)

581

# Not passing a progress bar, because it creates a new

582

# progress, which overwrites the current progress,

583

# and doesn't look nice

584

w.check()

585

checker.checked_weaves[self.file_id] = True

586

else:

587

w = tree.get_weave(self.file_id)

588

589

mutter('check version {%s} of {%s}', tree_revision_id, self.file_id)

590

checker.checked_text_cnt += 1

591

# We can't check the length, because Weave doesn't store that

592

# information, and the whole point of looking at the weave's

593

# sha1sum is that we don't have to extract the text.

594

if self.text_sha1 != w.get_sha1(self.revision):

595

raise BzrCheckError('text {%s} version {%s} wrong sha1'

596

% (self.file_id, self.revision))

597

checker.checked_texts[t] = self.text_sha1

598

599

def copy(self):

600

other = InventoryFile(self.file_id, self.name, self.parent_id)

601

other.executable = self.executable

602

other.text_id = self.text_id

603

other.text_sha1 = self.text_sha1

604

other.text_size = self.text_size

605

other.revision = self.revision

606

return other

607

608

def detect_changes(self, old_entry):

609

"""See InventoryEntry.detect_changes."""

610

assert self.text_sha1 != None

611

assert old_entry.text_sha1 != None

612

text_modified = (self.text_sha1 != old_entry.text_sha1)

613

meta_modified = (self.executable != old_entry.executable)

614

return text_modified, meta_modified

615

616

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

617

output_to, reverse=False):

618

"""See InventoryEntry._diff."""

619

try:

620

from_text = tree.get_file(self.file_id).readlines()

621

if to_entry:

622

to_text = to_tree.get_file(to_entry.file_id).readlines()

623

else:

624

to_text = []

625

if not reverse:

626

text_diff(from_label, from_text,

627

to_label, to_text, output_to)

628

else:

629

text_diff(to_label, to_text,

630

from_label, from_text, output_to)

631

except BinaryFile:

632

if reverse:

633

label_pair = (to_label, from_label)

634

else:

635

label_pair = (from_label, to_label)

636

print >> output_to, "Binary files %s and %s differ" % label_pair

637

638

def has_text(self):

639

"""See InventoryEntry.has_text."""

640

return True

641

642

def __init__(self, file_id, name, parent_id):

643

super(InventoryFile, self).__init__(file_id, name, parent_id)

644

self.kind = 'file'

645

646

def kind_character(self):

647

"""See InventoryEntry.kind_character."""

648

return ''

649

650

def _put_in_tar(self, item, tree):

651

"""See InventoryEntry._put_in_tar."""

652

item.type = tarfile.REGTYPE

653

fileobj = tree.get_file(self.file_id)

654

item.size = self.text_size

655

if tree.is_executable(self.file_id):

656

item.mode = 0755

657

else:

658

item.mode = 0644

659

return fileobj

660

661

def _put_on_disk(self, fullpath, tree):

662

"""See InventoryEntry._put_on_disk."""

663

pumpfile(tree.get_file(self.file_id), file(fullpath, 'wb'))

664

if tree.is_executable(self.file_id):

665

os.chmod(fullpath, 0755)

666

667

def _read_tree_state(self, path, work_tree):

668

"""See InventoryEntry._read_tree_state."""

669

self.text_sha1 = work_tree.get_file_sha1(self.file_id, path=path)

670

# FIXME: 20050930 probe for the text size when getting sha1

671

# in _read_tree_state

672

self.executable = work_tree.is_executable(self.file_id, path=path)

673

674

def _forget_tree_state(self):

675

self.text_sha1 = None

676

self.executable = None

677

678

def _snapshot_text(self, file_parents, work_tree, commit_builder):

679

"""See InventoryEntry._snapshot_text."""

680

def get_content_byte_lines():

681

return work_tree.get_file(self.file_id).readlines()

682

self.text_sha1, self.text_size = commit_builder.modified_file_text(

683

self.file_id, file_parents, get_content_byte_lines, self.text_sha1, self.text_size)

684

685

def _unchanged(self, previous_ie):

686

"""See InventoryEntry._unchanged."""

687

compatible = super(InventoryFile, self)._unchanged(previous_ie)

688

if self.text_sha1 != previous_ie.text_sha1:

689

compatible = False

690

else:

691

# FIXME: 20050930 probe for the text size when getting sha1

692

# in _read_tree_state

693

self.text_size = previous_ie.text_size

694

if self.executable != previous_ie.executable:

695

compatible = False

696

return compatible

697

698

699

class InventoryLink(InventoryEntry):

700

"""A symlink in an inventory."""

701

702

__slots__ = ['symlink_target']

703

704

def _check(self, checker, rev_id, tree):

705

"""See InventoryEntry._check"""

706

if self.text_sha1 != None or self.text_size != None or self.text_id != None:

707

raise BzrCheckError('symlink {%s} has text in revision {%s}'

708

% (self.file_id, rev_id))

709

if self.symlink_target is None:

710

raise BzrCheckError('symlink {%s} has no target in revision {%s}'

711

% (self.file_id, rev_id))

712

713

def copy(self):

714

other = InventoryLink(self.file_id, self.name, self.parent_id)

715

other.symlink_target = self.symlink_target

716

other.revision = self.revision

717

return other

718

719

def detect_changes(self, old_entry):

720

"""See InventoryEntry.detect_changes."""

721

# FIXME: which _modified field should we use ? RBC 20051003

722

text_modified = (self.symlink_target != old_entry.symlink_target)

723

if text_modified:

724

mutter(" symlink target changed")

725

meta_modified = False

726

return text_modified, meta_modified

727

728

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

729

output_to, reverse=False):

730

"""See InventoryEntry._diff."""

731

from_text = self.symlink_target

732

if to_entry is not None:

733

to_text = to_entry.symlink_target

734

if reverse:

735

temp = from_text

736

from_text = to_text

737

to_text = temp

738

print >>output_to, '=== target changed %r => %r' % (from_text, to_text)

739

else:

740

if not reverse:

741

print >>output_to, '=== target was %r' % self.symlink_target

742

else:

743

print >>output_to, '=== target is %r' % self.symlink_target

744

745

def __init__(self, file_id, name, parent_id):

746

super(InventoryLink, self).__init__(file_id, name, parent_id)

747

self.kind = 'symlink'

748

749

def kind_character(self):

750

"""See InventoryEntry.kind_character."""

751

return ''

752

753

def _put_in_tar(self, item, tree):

754

"""See InventoryEntry._put_in_tar."""

755

item.type = tarfile.SYMTYPE

756

fileobj = None

757

item.size = 0

758

item.mode = 0755

759

item.linkname = self.symlink_target

760

return fileobj

761

762

def _put_on_disk(self, fullpath, tree):

763

"""See InventoryEntry._put_on_disk."""

764

try:

765

os.symlink(self.symlink_target, fullpath)

766

except OSError,e:

767

raise BzrError("Failed to create symlink %r -> %r, error: %s" % (fullpath, self.symlink_target, e))

768

769

def _read_tree_state(self, path, work_tree):

770

"""See InventoryEntry._read_tree_state."""

771

self.symlink_target = work_tree.get_symlink_target(self.file_id)

772

773

def _forget_tree_state(self):

774

self.symlink_target = None

775

776

def _unchanged(self, previous_ie):

777

"""See InventoryEntry._unchanged."""

778

compatible = super(InventoryLink, self)._unchanged(previous_ie)

779

if self.symlink_target != previous_ie.symlink_target:

780

compatible = False

781

return compatible

782

783

def _snapshot_text(self, file_parents, work_tree, commit_builder):

784

"""See InventoryEntry._snapshot_text."""

785

commit_builder.modified_link(

786

self.file_id, file_parents, self.symlink_target)

787

249

788

250

789

class Inventory(object):

251

790

"""Inventory of versioned files in a tree.

265

804

inserted, other than through the Inventory API.

266

805

267

806

>>> inv = Inventory()

268

>>> inv.add(InventoryEntry('123-123', 'hello.c', 'file', ROOT_ID))

807

>>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))

808

InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT')

269

809

>>> inv['123-123'].name

270

810

'hello.c'

271

811

279

819

May also look up by name:

280

820

281

821

>>> [x[0] for x in inv.iter_entries()]

282

['hello.c']

822

[u'hello.c']

283

823

>>> inv = Inventory('TREE_ROOT-12345678-12345678')

284

>>> inv.add(InventoryEntry('123-123', 'hello.c', 'file', ROOT_ID))

824

>>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))

825

InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT-12345678-12345678')

285

826

"""

286

def __init__(self, root_id=ROOT_ID):

827

def __init__(self, root_id=ROOT_ID, revision_id=None):

287

828

"""Create or read an inventory.

288

829

289

830

If a working directory is specified, the inventory is read

293

834

The inventory is created with a default root directory, with

294

835

an id of None.

295

836

"""

296

# We are letting Branch(init=True) create a unique inventory

837

# We are letting Branch.create() create a unique inventory

297

838

# root id. Rather than generating a random one here.

298

839

#if root_id is None:

299

840

# root_id = bzrlib.branch.gen_file_id('TREE_ROOT')

300

841

self.root = RootEntry(root_id)

842

self.revision_id = revision_id

301

843

self._byid = {self.root.file_id: self.root}

302

844

845

def copy(self):

846

# TODO: jam 20051218 Should copy also copy the revision_id?

847

other = Inventory(self.root.file_id)

848

# copy recursively so we know directories will be added before

849

# their children. There are more efficient ways than this...

850

for path, entry in self.iter_entries():

851

if entry == self.root:

852

continue

853

other.add(entry.copy())

854

return other

303

855

304

856

def __iter__(self):

305

857

return iter(self._byid)

306

858

307

308

859

def __len__(self):

309

860

"""Returns number of entries."""

310

861

return len(self._byid)

311

862

312

313

863

def iter_entries(self, from_dir=None):

314

864

"""Return (path, entry) pairs, in order by name."""

315

if from_dir == None:

316

assert self.root

317

from_dir = self.root

318

elif isinstance(from_dir, basestring):

319

from_dir = self._byid[from_dir]

320

321

kids = from_dir.children.items()

322

kids.sort()

323

for name, ie in kids:

324

yield name, ie

325

if ie.kind == 'directory':

326

for cn, cie in self.iter_entries(from_dir=ie.file_id):

327

yield os.path.join(name, cn), cie

328

865

if from_dir is None:

866

assert self.root

867

from_dir = self.root

868

elif isinstance(from_dir, basestring):

869

from_dir = self._byid[from_dir]

870

871

# unrolling the recursive call changed the time from

872

# 440ms/663ms (inline/total) to 116ms/116ms

873

children = from_dir.children.items()

874

children.sort()

875

children = collections.deque(children)

876

stack = [(u'', children)]

877

while stack:

878

from_dir_relpath, children = stack[-1]

879

880

while children:

881

name, ie = children.popleft()

882

883

# we know that from_dir_relpath never ends in a slash

884

# and 'f' doesn't begin with one, we can do a string op, rather

885

# than the checks of pathjoin(), though this means that all paths

886

# start with a slash

887

path = from_dir_relpath + '/' + name

888

889

yield path[1:], ie

890

891

if ie.kind != 'directory':

892

continue

893

894

# But do this child first

895

new_children = ie.children.items()

896

new_children.sort()

897

new_children = collections.deque(new_children)

898

stack.append((path, new_children))

899

# Break out of inner loop, so that we start outer loop with child

900

break

901

else:

902

# if we finished all children, pop it off the stack

903

stack.pop()

904

905

def iter_entries_by_dir(self, from_dir=None):

906

"""Iterate over the entries in a directory first order.

907

908

This returns all entries for a directory before returning

909

the entries for children of a directory. This is not

910

lexicographically sorted order, and is a hybrid between

911

depth-first and breadth-first.

912

913

:return: This yields (path, entry) pairs

914

"""

915

# TODO? Perhaps this should return the from_dir so that the root is

916

# yielded? or maybe an option?

917

if from_dir is None:

918

assert self.root

919

from_dir = self.root

920

elif isinstance(from_dir, basestring):

921

from_dir = self._byid[from_dir]

922

923

stack = [(u'', from_dir)]

924

while stack:

925

cur_relpath, cur_dir = stack.pop()

926

927

child_dirs = []

928

for child_name, child_ie in sorted(cur_dir.children.iteritems()):

929

930

child_relpath = cur_relpath + child_name

931

932

yield child_relpath, child_ie

933

934

if child_ie.kind == 'directory':

935

child_dirs.append((child_relpath+'/', child_ie))

936

stack.extend(reversed(child_dirs))

329

937

330

938

def entries(self):

331

939

"""Return list of (path, ie) for all entries except the root.

337

945

kids = dir_ie.children.items()

338

946

kids.sort()

339

947

for name, ie in kids:

340

child_path = os.path.join(dir_path, name)

948

child_path = pathjoin(dir_path, name)

341

949

accum.append((child_path, ie))

342

950

if ie.kind == 'directory':

343

951

descend(ie, child_path)

344

952

345

descend(self.root, '')

953

descend(self.root, u'')

346

954

return accum

347

955

348

349

956

def directories(self):

350

957

"""Return (path, entry) pairs for all directories, including the root.

351

958

"""

357

964

kids.sort()

358

965

359

966

for name, child_ie in kids:

360

child_path = os.path.join(parent_path, name)

967

child_path = pathjoin(parent_path, name)

361

968

descend(child_ie, child_path)

362

descend(self.root, '')

969

descend(self.root, u'')

363

970

return accum

364

971

365

366

367

972

def __contains__(self, file_id):

368

973

"""True if this entry contains a file with given id.

369

974

370

975

>>> inv = Inventory()

371

>>> inv.add(InventoryEntry('123', 'foo.c', 'file', ROOT_ID))

976

>>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))

977

InventoryFile('123', 'foo.c', parent_id='TREE_ROOT')

372

978

>>> '123' in inv

373

979

True

374

980

>>> '456' in inv

376

982

"""

377

983

return file_id in self._byid

378

984

379

380

985

def __getitem__(self, file_id):

381

986

"""Return the entry for given file_id.

382

987

383

988

>>> inv = Inventory()

384

>>> inv.add(InventoryEntry('123123', 'hello.c', 'file', ROOT_ID))

989

>>> inv.add(InventoryFile('123123', 'hello.c', ROOT_ID))

990

InventoryFile('123123', 'hello.c', parent_id='TREE_ROOT')

385

991

>>> inv['123123'].name

386

992

'hello.c'

387

993

"""

388

994

try:

389

995

return self._byid[file_id]

390

996

except KeyError:

391

if file_id == None:

997

if file_id is None:

392

998

raise BzrError("can't look up file_id None")

393

999

else:

394

1000

raise BzrError("file_id {%s} not in inventory" % file_id)

395

1001

396

397

1002

def get_file_kind(self, file_id):

398

1003

return self._byid[file_id].kind

399

1004

400

1005

def get_child(self, parent_id, filename):

401

1006

return self[parent_id].children.get(filename)

402

1007

403

404

1008

def add(self, entry):

405

1009

"""Add entry to inventory.

406

1010

407

1011

To add a file to a branch ready to be committed, use Branch.add,

408

which calls this."""

1012

which calls this.

1013

1014

Returns the new entry object.

1015

"""

409

1016

if entry.file_id in self._byid:

410

1017

raise BzrError("inventory already contains entry with id {%s}" % entry.file_id)

411

1018

419

1026

420

1027

if parent.children.has_key(entry.name):

421

1028

raise BzrError("%s is already versioned" %

422

appendpath(self.id2path(parent.file_id), entry.name))

1029

pathjoin(self.id2path(parent.file_id), entry.name))

423

1030

424

1031

self._byid[entry.file_id] = entry

425

1032

parent.children[entry.name] = entry

426

427

428

def add_path(self, relpath, kind, file_id=None):

1033

return entry

1034

1035

def add_path(self, relpath, kind, file_id=None, parent_id=None):

429

1036

"""Add entry from a path.

430

1037

431

The immediate parent must already be versioned"""

432

from bzrlib.errors import NotVersionedError

1038

The immediate parent must already be versioned.

1039

1040

Returns the new entry object."""

433

1041

434

1042

parts = bzrlib.osutils.splitpath(relpath)

1043

435

1044

if len(parts) == 0:

436

raise BzrError("cannot re-add root of inventory")

437

438

if file_id == None:

439

from bzrlib.branch import gen_file_id

440

file_id = gen_file_id(relpath)

441

442

parent_path = parts[:-1]

443

parent_id = self.path2id(parent_path)

444

if parent_id == None:

445

raise NotVersionedError(parent_path)

446

447

ie = InventoryEntry(file_id, parts[-1],

448

kind=kind, parent_id=parent_id)

1045

if file_id is None:

1046

file_id = bzrlib.workingtree.gen_root_id()

1047

self.root = RootEntry(file_id)

1048

self._byid = {self.root.file_id: self.root}

1049

return

1050

else:

1051

parent_path = parts[:-1]

1052

parent_id = self.path2id(parent_path)

1053

if parent_id is None:

1054

raise NotVersionedError(path=parent_path)

1055

ie = make_entry(kind, parts[-1], parent_id, file_id)

449

1056

return self.add(ie)

450

1057

451

452

1058

def __delitem__(self, file_id):

453

1059

"""Remove entry by id.

454

1060

455

1061

>>> inv = Inventory()

456

>>> inv.add(InventoryEntry('123', 'foo.c', 'file', ROOT_ID))

1062

>>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))

1063

InventoryFile('123', 'foo.c', parent_id='TREE_ROOT')

457

1064

>>> '123' in inv

458

1065

True

459

1066

>>> del inv['123']

462

1069

"""

463

1070

ie = self[file_id]

464

1071

465

assert self[ie.parent_id].children[ie.name] == ie

1072

assert ie.parent_id is None or \

1073

self[ie.parent_id].children[ie.name] == ie

466

1074

467

# TODO: Test deleting all children; maybe hoist to a separate

468

# deltree method?

469

if ie.kind == 'directory':

470

for cie in ie.children.values():

471

del self[cie.file_id]

472

del ie.children

473

474

1075

del self._byid[file_id]

475

del self[ie.parent_id].children[ie.name]

476

477

478

def to_element(self):

479

"""Convert to XML Element"""

480

from bzrlib.xml import Element

481

482

e = Element('inventory')

483

e.text = '\n'

484

if self.root.file_id not in (None, ROOT_ID):

485

e.set('file_id', self.root.file_id)

486

for path, ie in self.iter_entries():

487

e.append(ie.to_element())

488

return e

489

490

491

def from_element(cls, elt):

492

"""Construct from XML Element

493

494

>>> inv = Inventory()

495

>>> inv.add(InventoryEntry('foo.c-123981239', 'foo.c', 'file', ROOT_ID))

496

>>> elt = inv.to_element()

497

>>> inv2 = Inventory.from_element(elt)

498

>>> inv2 == inv

499

True

500

"""

501

# XXXX: doctest doesn't run this properly under python2.3

502

assert elt.tag == 'inventory'

503

root_id = elt.get('file_id') or ROOT_ID

504

o = cls(root_id)

505

for e in elt:

506

ie = InventoryEntry.from_element(e)

507

if ie.parent_id == ROOT_ID:

508

ie.parent_id = root_id

509

o.add(ie)

510

return o

511

512

from_element = classmethod(from_element)

513

1076

if ie.parent_id is not None:

1077

del self[ie.parent_id].children[ie.name]

514

1078

515

1079

def __eq__(self, other):

516

1080

"""Compare two sets by comparing their contents.

519

1083

>>> i2 = Inventory()

520

1084

>>> i1 == i2

521

1085

True

522

>>> i1.add(InventoryEntry('123', 'foo', 'file', ROOT_ID))

1086

>>> i1.add(InventoryFile('123', 'foo', ROOT_ID))

1087

InventoryFile('123', 'foo', parent_id='TREE_ROOT')

523

1088

>>> i1 == i2

524

1089

False

525

>>> i2.add(InventoryEntry('123', 'foo', 'file', ROOT_ID))

1090

>>> i2.add(InventoryFile('123', 'foo', ROOT_ID))

1091

InventoryFile('123', 'foo', parent_id='TREE_ROOT')

526

1092

>>> i1 == i2

527

1093

True

528

1094

"""

535

1101

536

1102

return self._byid == other._byid

537

1103

538

539

1104

def __ne__(self, other):

540

return not (self == other)

541

1105

return not self.__eq__(other)

542

1106

543

1107

def __hash__(self):

544

1108

raise ValueError('not hashable')

545

1109

546

1110

def _iter_file_id_parents(self, file_id):

1111

"""Yield the parents of file_id up to the root."""

1112

while file_id != None:

1113

try:

1114

ie = self._byid[file_id]

1115

except KeyError:

1116

raise BzrError("file_id {%s} not found in inventory" % file_id)

1117

yield ie

1118

file_id = ie.parent_id

547

1119

548

1120

def get_idpath(self, file_id):

549

1121

"""Return a list of file_ids for the path to an entry.

554

1126

root directory as depth 1.

555

1127

"""

556

1128

p = []

557

while file_id != None:

558

try:

559

ie = self._byid[file_id]

560

except KeyError:

561

raise BzrError("file_id {%s} not found in inventory" % file_id)

562

p.insert(0, ie.file_id)

563

file_id = ie.parent_id

1129

for parent in self._iter_file_id_parents(file_id):

1130

p.insert(0, parent.file_id)

564

1131

return p

565

1132

566

567

1133

def id2path(self, file_id):

568

"""Return as a list the path to file_id."""

569

1134

"""Return as a string the path to file_id.

1135

1136

>>> i = Inventory()

1137

>>> e = i.add(InventoryDirectory('src-id', 'src', ROOT_ID))

1138

>>> e = i.add(InventoryFile('foo-id', 'foo.c', parent_id='src-id'))

1139

>>> print i.id2path('foo-id')

1140

src/foo.c

1141

"""

570

1142

# get all names, skipping root

571

p = [self._byid[fid].name for fid in self.get_idpath(file_id)[1:]]

572

return os.sep.join(p)

1143

return '/'.join(reversed(

1144

[parent.name for parent in

1145

self._iter_file_id_parents(file_id)][:-1]))

573

1146

574

575

576

1147

def path2id(self, name):

577

1148

"""Walk down through directories to return entry of last component.

578

1149

582

1153

This returns the entry of the last component in the path,

583

1154

which may be either a file or a directory.

584

1155

585

Returns None iff the path is not found.

1156

Returns None IFF the path is not found.

586

1157

"""

587

1158

if isinstance(name, types.StringTypes):

588

1159

name = splitpath(name)

589

1160

590

mutter("lookup path %r" % name)

1161

# mutter("lookup path %r" % name)

591

1162

592

1163

parent = self.root

593

1164

for f in name:

602

1173

603

1174

return parent.file_id

604

1175

605

606

1176

def has_filename(self, names):

607

1177

return bool(self.path2id(names))

608

1178

609

610

1179

def has_id(self, file_id):

611

1180

return self._byid.has_key(file_id)

612

1181

613

614

1182

def rename(self, file_id, new_parent_id, new_name):

615

1183

"""Move a file within the inventory.

616

1184

641

1209

file_ie.parent_id = new_parent_id

642

1210

643

1211

644

645

646

_NAME_RE = re.compile(r'^[^/\\]+$')

1212

def make_entry(kind, name, parent_id, file_id=None):

1213

"""Create an inventory entry.

1214

1215

:param kind: the type of inventory entry to create.

1216

:param name: the basename of the entry.

1217

:param parent_id: the parent_id of the entry.

1218

:param file_id: the file_id to use. if None, one will be created.

1219

"""

1220

if file_id is None:

1221

file_id = bzrlib.workingtree.gen_file_id(name)

1222

if kind == 'directory':

1223

return InventoryDirectory(file_id, name, parent_id)

1224

elif kind == 'file':

1225

return InventoryFile(file_id, name, parent_id)

1226

elif kind == 'symlink':

1227

return InventoryLink(file_id, name, parent_id)

1228

else:

1229

raise BzrError("unknown kind %r" % kind)

1230

1231

1232

1233

_NAME_RE = None

647

1234

648

1235

def is_valid_name(name):

1236

global _NAME_RE

1237

if _NAME_RE is None:

1238

_NAME_RE = re.compile(r'^[^/\\]+$')

1239

649

1240

return bool(_NAME_RE.match(name))

Older »