~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/inventory.py

Committer: Jelmer Vernooij
Date: 2006-06-21 13:54:14 UTC
mto: (1558.14.8 Aaron's integration)
mto: This revision was merged to the branch mainline in revision 1803.
Revision ID: jelmer@samba.org-20060621135414-11a3a70e53adbb99

Install benchmarks.

files added:
BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS.developers

bzrlib/annotate.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/read_bundle.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v07.py

bzrlib/bzrdir.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/identitymap.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lsprof.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/store

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_emptytree.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/pwclient.full

contrib/pwk

doc/README.1st

doc/configuration.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

generate_docs.py

profile_imports.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

files removed:
bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/statcache.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/new-inventory-sample.xml

notes/performance.txt

patches

patches/find-touching-from-seq.diff

patches/symlink-support.patch

testbzr

files renamed:
bzrlib/changeset.py => bzrlib/bundle/__init__.py

bzrlib/store.py => bzrlib/store/__init__.py

bzrlib/selftest.py => bzrlib/tests/__init__.py

bzrlib/whitebox.py => bzrlib/tests/test_whitebox.py

elementtree/ => bzrlib/util/elementtree/

urlgrabber/ => bzrlib/util/urlgrabber/

bzrlib/xml.py => bzrlib/xml_serializer.py

bzrlib/newinventory.py => contrib/newinventory.py

bzr-man.py => tools/doc_generate/autodoc_man.py

files modified:
.bzrignore

.rsyncexclude

NEWS

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/help.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/revision.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/workingtree.py

contrib/add-bzr-to-baz

contrib/upload-bzr.dev

contrib/zsh/_bzr

setup.py *

Show diffs side-by-side

added added

removed removed

bzrlib/inventory.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# FIXME: This refactoring of the workingtree code doesn't seem to keep

# the WorkingTree's copy of the inventory in sync with the branch. The

# branch modifies its working inventory when it does a commit to make

# missing files permanently removed.

# TODO: Maybe also keep the full path of the entry, and the children?

# But those depend on its position within a particular inventory, and

# it would be nice not to need to hold the backpointer here.

# This should really be an id randomly assigned when the tree is

# created, but it's not for now.

ROOT_ID = "TREE_ROOT"

import sys, os.path, types, re

try:

from cElementTree import Element, ElementTree, SubElement

except ImportError:

from elementtree.ElementTree import Element, ElementTree, SubElement

from xml import XMLMixin

from errors import bailout, BzrError, BzrCheckError

import collections

import os.path

import re

import sys

import tarfile

import types

import bzrlib

from bzrlib.osutils import uuid, quotefn, splitpath, joinpath, appendpath

from bzrlib.osutils import (pumpfile, quotefn, splitpath, joinpath,

pathjoin, sha_strings)

from bzrlib.errors import (NotVersionedError, InvalidEntryName,

BzrError, BzrCheckError, BinaryFile)

from bzrlib.trace import mutter

class InventoryEntry(XMLMixin):

class InventoryEntry(object):

"""Description of a versioned file.

An InventoryEntry has the following fields, which are also

present in the XML inventory-entry element:

* *file_id*

* *name*: (only the basename within the directory, must not

contain slashes)

* *kind*: "directory" or "file"

* *directory_id*: (if absent/null means the branch root directory)

* *text_sha1*: only for files

* *text_size*: in bytes, only for files

* *text_id*: identifier for the text version, only for files

InventoryEntries can also exist inside a WorkingTree

inventory, in which case they are not yet bound to a

particular revision of the file. In that case the text_sha1,

text_size and text_id are absent.

file_id

name

(within the parent directory)

parent_id

file_id of the parent directory, or ROOT_ID

revision

the revision_id in which this variation of this file was

introduced.

executable

Indicates that this file should be executable on systems

that support it.

text_sha1

sha-1 of the text of the file

text_size

size in bytes of the text of the file

(reading a version 4 tree created a text_id field.)

>>> i = Inventory()

>>> i.path2id('')

'TREE_ROOT'

>>> i.add(InventoryEntry('123', 'src', 'directory', ROOT_ID))

>>> i.add(InventoryEntry('2323', 'hello.c', 'file', parent_id='123'))

>>> for j in i.iter_entries():

... print j

>>> i.add(InventoryDirectory('123', 'src', ROOT_ID))

InventoryDirectory('123', 'src', parent_id='TREE_ROOT', revision=None)

>>> i.add(InventoryFile('2323', 'hello.c', parent_id='123'))

InventoryFile('2323', 'hello.c', parent_id='123', sha1=None, len=None)

>>> shouldbe = {0: 'src', 1: pathjoin('src','hello.c')}

>>> for ix, j in enumerate(i.iter_entries()):

... print (j[0] == shouldbe[ix], j[1])

...

('src', InventoryEntry('123', 'src', kind='directory', parent_id='TREE_ROOT'))

('src/hello.c', InventoryEntry('2323', 'hello.c', kind='file', parent_id='123'))

>>> i.add(InventoryEntry('2323', 'bye.c', 'file', '123'))

(True, InventoryDirectory('123', 'src', parent_id='TREE_ROOT', revision=None))

(True, InventoryFile('2323', 'hello.c', parent_id='123', sha1=None, len=None))

>>> i.add(InventoryFile('2323', 'bye.c', '123'))

Traceback (most recent call last):

...

BzrError: ('inventory already contains entry with id {2323}', [])

>>> i.add(InventoryEntry('2324', 'bye.c', 'file', '123'))

>>> i.add(InventoryEntry('2325', 'wibble', 'directory', '123'))

BzrError: inventory already contains entry with id {2323}

>>> i.add(InventoryFile('2324', 'bye.c', '123'))

InventoryFile('2324', 'bye.c', parent_id='123', sha1=None, len=None)

>>> i.add(InventoryDirectory('2325', 'wibble', '123'))

InventoryDirectory('2325', 'wibble', parent_id='123', revision=None)

>>> i.path2id('src/wibble')

'2325'

>>> '2325' in i

100

True

>>> i.add(InventoryEntry('2326', 'wibble.c', 'file', '2325'))

101

>>> i.add(InventoryFile('2326', 'wibble.c', '2325'))

102

InventoryFile('2326', 'wibble.c', parent_id='2325', sha1=None, len=None)

103

>>> i['2326']

InventoryEntry('2326', 'wibble.c', kind='file', parent_id='2325')

>>> for j in i.iter_entries():

... print j[0]

... assert i.path2id(j[0])

104

InventoryFile('2326', 'wibble.c', parent_id='2325', sha1=None, len=None)

105

>>> for path, entry in i.iter_entries():

106

... print path

107

... assert i.path2id(path)

108

...

109

src

110

src/bye.c

113

src/wibble/wibble.c

114

>>> i.id2path('2326')

115

'src/wibble/wibble.c'

TODO: Maybe also keep the full path of the entry, and the children?

But those depend on its position within a particular inventory, and

it would be nice not to need to hold the backpointer here.

116

"""

117

# TODO: split InventoryEntry into subclasses for files,

# directories, etc etc.

100

101

text_sha1 = None

102

text_size = None

118

# Constants returned by describe_change()

119

120

# TODO: These should probably move to some kind of FileChangeDescription

121

# class; that's like what's inside a TreeDelta but we want to be able to

122

# generate them just for one file at a time.

123

RENAMED = 'renamed'

124

MODIFIED_AND_RENAMED = 'modified and renamed'

103

125

104

def __init__(self, file_id, name, kind, parent_id, text_id=None):

126

__slots__ = []

127

128

def detect_changes(self, old_entry):

129

"""Return a (text_modified, meta_modified) from this to old_entry.

130

131

_read_tree_state must have been called on self and old_entry prior to

132

calling detect_changes.

133

"""

134

return False, False

135

136

def diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

137

output_to, reverse=False):

138

"""Perform a diff from this to to_entry.

139

140

text_diff will be used for textual difference calculation.

141

This is a template method, override _diff in child classes.

142

"""

143

self._read_tree_state(tree.id2path(self.file_id), tree)

144

if to_entry:

145

# cannot diff from one kind to another - you must do a removal

146

# and an add if they do not match.

147

assert self.kind == to_entry.kind

148

to_entry._read_tree_state(to_tree.id2path(to_entry.file_id),

149

to_tree)

150

self._diff(text_diff, from_label, tree, to_label, to_entry, to_tree,

151

output_to, reverse)

152

153

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

154

output_to, reverse=False):

155

"""Perform a diff between two entries of the same kind."""

156

157

def find_previous_heads(self, previous_inventories,

158

versioned_file_store,

159

transaction,

160

entry_vf=None):

161

"""Return the revisions and entries that directly precede this.

162

163

Returned as a map from revision to inventory entry.

164

165

This is a map containing the file revisions in all parents

166

for which the file exists, and its revision is not a parent of

167

any other. If the file is new, the set will be empty.

168

169

:param versioned_file_store: A store where ancestry data on this

170

file id can be queried.

171

:param transaction: The transaction that queries to the versioned

172

file store should be completed under.

173

:param entry_vf: The entry versioned file, if it's already available.

174

"""

175

def get_ancestors(weave, entry):

176

return set(weave.get_ancestry(entry.revision))

177

# revision:ie mapping for each ie found in previous_inventories.

178

candidates = {}

179

# revision:ie mapping with one revision for each head.

180

heads = {}

181

# revision: ancestor list for each head

182

head_ancestors = {}

183

# identify candidate head revision ids.

184

for inv in previous_inventories:

185

if self.file_id in inv:

186

ie = inv[self.file_id]

187

assert ie.file_id == self.file_id

188

if ie.revision in candidates:

189

# same revision value in two different inventories:

190

# correct possible inconsistencies:

191

# * there was a bug in revision updates with 'x' bit

192

# support.

193

try:

194

if candidates[ie.revision].executable != ie.executable:

195

candidates[ie.revision].executable = False

196

ie.executable = False

197

except AttributeError:

198

pass

199

# must now be the same.

200

assert candidates[ie.revision] == ie

201

else:

202

# add this revision as a candidate.

203

candidates[ie.revision] = ie

204

205

# common case optimisation

206

if len(candidates) == 1:

207

# if there is only one candidate revision found

208

# then we can avoid opening the versioned file to access ancestry:

209

# there cannot be any ancestors to eliminate when there is

210

# only one revision available.

211

heads[ie.revision] = ie

212

return heads

213

214

# eliminate ancestors amongst the available candidates:

215

# heads are those that are not an ancestor of any other candidate

216

# - this provides convergence at a per-file level.

217

for ie in candidates.values():

218

# may be an ancestor of a known head:

219

already_present = 0 != len(

220

[head for head in heads

221

if ie.revision in head_ancestors[head]])

222

if already_present:

223

# an ancestor of an analyzed candidate.

224

continue

225

# not an ancestor of a known head:

226

# load the versioned file for this file id if needed

227

if entry_vf is None:

228

entry_vf = versioned_file_store.get_weave_or_empty(

229

self.file_id, transaction)

230

ancestors = get_ancestors(entry_vf, ie)

231

# may knock something else out:

232

check_heads = list(heads.keys())

233

for head in check_heads:

234

if head in ancestors:

235

# this previously discovered 'head' is not

236

# really a head - it's an ancestor of the newly

237

# found head,

238

heads.pop(head)

239

head_ancestors[ie.revision] = ancestors

240

heads[ie.revision] = ie

241

return heads

242

243

def get_tar_item(self, root, dp, now, tree):

244

"""Get a tarfile item and a file stream for its content."""

245

item = tarfile.TarInfo(pathjoin(root, dp))

246

# TODO: would be cool to actually set it to the timestamp of the

247

# revision it was last changed

248

item.mtime = now

249

fileobj = self._put_in_tar(item, tree)

250

return item, fileobj

251

252

def has_text(self):

253

"""Return true if the object this entry represents has textual data.

254

255

Note that textual data includes binary content.

256

257

Also note that all entries get weave files created for them.

258

This attribute is primarily used when upgrading from old trees that

259

did not have the weave index for all inventory entries.

260

"""

261

return False

262

263

def __init__(self, file_id, name, parent_id, text_id=None):

105

264

"""Create an InventoryEntry

106

265

107

266

The filename must be a single component, relative to the

108

267

parent directory; it cannot be a whole path or relative name.

109

268

110

>>> e = InventoryEntry('123', 'hello.c', 'file', ROOT_ID)

269

>>> e = InventoryFile('123', 'hello.c', ROOT_ID)

111

270

>>> e.name

112

271

'hello.c'

113

272

>>> e.file_id

114

273

'123'

115

>>> e = InventoryEntry('123', 'src/hello.c', 'file', ROOT_ID)

274

>>> e = InventoryFile('123', 'src/hello.c', ROOT_ID)

116

275

Traceback (most recent call last):

117

BzrCheckError: InventoryEntry name 'src/hello.c' is invalid

276

InvalidEntryName: Invalid entry name: src/hello.c

118

277

"""

278

assert isinstance(name, basestring), name

119

279

if '/' in name or '\\' in name:

120

raise BzrCheckError('InventoryEntry name %r is invalid' % name)

121

280

raise InvalidEntryName(name=name)

281

self.executable = False

282

self.revision = None

283

self.text_sha1 = None

284

self.text_size = None

122

285

self.file_id = file_id

123

286

self.name = name

124

self.kind = kind

125

287

self.text_id = text_id

126

288

self.parent_id = parent_id

127

if kind == 'directory':

128

self.children = {}

129

elif kind == 'file':

130

pass

131

else:

132

raise BzrError("unhandled entry kind %r" % kind)

133

134

289

self.symlink_target = None

290

291

def kind_character(self):

292

"""Return a short kind indicator useful for appending to names."""

293

raise BzrError('unknown kind %r' % self.kind)

294

295

known_kinds = ('file', 'directory', 'symlink', 'root_directory')

296

297

def _put_in_tar(self, item, tree):

298

"""populate item for stashing in a tar, and return the content stream.

299

300

If no content is available, return None.

301

"""

302

raise BzrError("don't know how to export {%s} of kind %r" %

303

(self.file_id, self.kind))

304

305

def put_on_disk(self, dest, dp, tree):

306

"""Create a representation of self on disk in the prefix dest.

307

308

This is a template method - implement _put_on_disk in subclasses.

309

"""

310

fullpath = pathjoin(dest, dp)

311

self._put_on_disk(fullpath, tree)

312

mutter(" export {%s} kind %s to %s", self.file_id,

313

self.kind, fullpath)

314

315

def _put_on_disk(self, fullpath, tree):

316

"""Put this entry onto disk at fullpath, from tree tree."""

317

raise BzrError("don't know how to export {%s} of kind %r" % (self.file_id, self.kind))

135

318

136

319

def sorted_children(self):

137

l = self.children.items()

138

l.sort()

139

return l

140

320

return sorted(self.children.items())

321

322

@staticmethod

323

def versionable_kind(kind):

324

return kind in ('file', 'directory', 'symlink')

325

326

def check(self, checker, rev_id, inv, tree):

327

"""Check this inventory entry is intact.

328

329

This is a template method, override _check for kind specific

330

tests.

331

332

:param checker: Check object providing context for the checks;

333

can be used to find out what parts of the repository have already

334

been checked.

335

:param rev_id: Revision id from which this InventoryEntry was loaded.

336

Not necessarily the last-changed revision for this file.

337

:param inv: Inventory from which the entry was loaded.

338

:param tree: RevisionTree for this entry.

339

"""

340

if self.parent_id is not None:

341

if not inv.has_id(self.parent_id):

342

raise BzrCheckError('missing parent {%s} in inventory for revision {%s}'

343

% (self.parent_id, rev_id))

344

self._check(checker, rev_id, tree)

345

346

def _check(self, checker, rev_id, tree):

347

"""Check this inventory entry for kind specific errors."""

348

raise BzrCheckError('unknown entry kind %r in revision {%s}' %

349

(self.kind, rev_id))

141

350

142

351

def copy(self):

143

other = InventoryEntry(self.file_id, self.name, self.kind,

144

self.parent_id, text_id=self.text_id)

145

other.text_sha1 = self.text_sha1

146

other.text_size = self.text_size

147

# note that children are *not* copied; they're pulled across when

148

# others are added

149

return other

150

352

"""Clone this inventory entry."""

353

raise NotImplementedError

354

355

@staticmethod

356

def describe_change(old_entry, new_entry):

357

"""Describe the change between old_entry and this.

358

359

This smells of being an InterInventoryEntry situation, but as it's

360

the first one, we're making it a static method for now.

361

362

An entry with a different parent, or different name is considered

363

to be renamed. Reparenting is an internal detail.

364

Note that renaming the parent does not trigger a rename for the

365

child entry itself.

366

"""

367

# TODO: Perhaps return an object rather than just a string

368

if old_entry is new_entry:

369

# also the case of both being None

370

return 'unchanged'

371

elif old_entry is None:

372

return 'added'

373

elif new_entry is None:

374

return 'removed'

375

text_modified, meta_modified = new_entry.detect_changes(old_entry)

376

if text_modified or meta_modified:

377

modified = True

378

else:

379

modified = False

380

# TODO 20060511 (mbp, rbc) factor out 'detect_rename' here.

381

if old_entry.parent_id != new_entry.parent_id:

382

renamed = True

383

elif old_entry.name != new_entry.name:

384

renamed = True

385

else:

386

renamed = False

387

if renamed and not modified:

388

return InventoryEntry.RENAMED

389

if modified and not renamed:

390

return 'modified'

391

if modified and renamed:

392

return InventoryEntry.MODIFIED_AND_RENAMED

393

return 'unchanged'

151

394

152

395

def __repr__(self):

153

return ("%s(%r, %r, kind=%r, parent_id=%r)"

396

return ("%s(%r, %r, parent_id=%r, revision=%r)"

154

397

% (self.__class__.__name__,

155

398

self.file_id,

156

399

self.name,

157

self.kind,

158

self.parent_id))

159

160

161

def to_element(self):
    """Convert this entry to an XML element.

    Builds an 'entry' element carrying name, file_id and kind, plus
    text_size, text_id and text_sha1 when they are not None, and
    parent_id when the parent is not ROOT_ID.

    :returns: the new element; its tail is set to a newline.
    """
    e = Element('entry')

    e.set('name', self.name)
    e.set('file_id', self.file_id)
    e.set('kind', self.kind)

    # None is tested by identity so the check cannot be affected by how
    # the stored value implements comparison.
    if self.text_size is not None:
        e.set('text_size', '%d' % self.text_size)

    for f in ['text_id', 'text_sha1']:
        v = getattr(self, f)
        if v is not None:
            e.set(f, v)

    # to be conservative, we don't externalize the root pointers
    # for now, leaving them as null in the xml form.  in a future
    # version it will be implied by nested elements.
    if self.parent_id != ROOT_ID:
        assert isinstance(self.parent_id, basestring)
        e.set('parent_id', self.parent_id)

    e.tail = '\n'

    return e

187

188

189

def from_element(cls, elt):
    """Build an entry from an 'entry' XML element.

    :param elt: element whose tag is 'entry'; its file_id, name, kind,
        parent_id, text_id, text_sha1 and text_size attributes are read
        with elt.get().
    :returns: a new cls instance.  text_size is an int when the
        attribute holds a value, otherwise None.
    """
    assert elt.tag == 'entry'

    ## original format inventories don't have a parent_id for
    ## nodes in the root directory, but it's cleaner to use one
    ## internally.
    parent_id = elt.get('parent_id')
    if parent_id is None:
        parent_id = ROOT_ID

    entry = cls(elt.get('file_id'), elt.get('name'), elt.get('kind'),
                parent_id)
    entry.text_id = elt.get('text_id')
    entry.text_sha1 = elt.get('text_sha1')

    # A missing or empty attribute means "size unknown"; never let a raw
    # string end up in text_size.
    size = elt.get('text_size')
    if size:
        entry.text_size = int(size)
    else:
        entry.text_size = None

    return entry

from_element = classmethod(from_element)

400

self.parent_id,

401

self.revision))

402

403

def snapshot(self, revision, path, previous_entries,
             work_tree, commit_builder):
    """Snapshot this entry, which may or may not have changed.

    The tree state for `path` is read first.  When there is exactly one
    previous entry and _unchanged() accepts it, this entry takes over
    that entry's revision and "unchanged" is returned.  In every other
    case the result of _snapshot_into_revision() is returned.
    """
    mutter('new parents of %s are %r', path, previous_entries)
    self._read_tree_state(path, work_tree)
    # TODO: Where should we determine whether to reuse a
    # previous revision id or create a new revision? 20060606
    if len(previous_entries) == 1:
        # cannot be unchanged unless there is only one parent file rev.
        only_parent = previous_entries.values()[0]
        unchanged = self._unchanged(only_parent)
    else:
        unchanged = False

    if not unchanged:
        return self._snapshot_into_revision(revision, previous_entries,
                                            work_tree, commit_builder)

    mutter("found unchanged entry")
    self.revision = only_parent.revision
    return "unchanged"

423

424

def _snapshot_into_revision(self, revision, previous_entries, work_tree,
                            commit_builder):
    """Record this entry unconditionally as part of `revision`.

    The entry's last-changed revision property (`revision`) is set to
    the new revision, then the text is recorded via _snapshot_text().

    :param revision: id of the new revision that is being recorded.
    :returns: None; there is no return statement in this method.
    """
    new_revision = revision
    mutter('new revision {%s} for {%s}', new_revision, self.file_id)
    self.revision = new_revision
    self._snapshot_text(previous_entries, work_tree, commit_builder)

438

439

def _snapshot_text(self, file_parents, work_tree, commit_builder):
    """Record the 'text' of this entry, whatever form that takes.

    This base implementation always raises NotImplementedError, passing
    the bound method as the exception argument.
    """
    unimplemented = self._snapshot_text
    raise NotImplementedError(unimplemented)

212

445

213

446

def __eq__(self, other):

214

447

if not isinstance(other, InventoryEntry):

215

448

return NotImplemented

216

449

217

return (self.file_id == other.file_id) \

218

and (self.name == other.name) \

219

and (self.text_sha1 == other.text_sha1) \

220

and (self.text_size == other.text_size) \

221

and (self.text_id == other.text_id) \

222

and (self.parent_id == other.parent_id) \

223

and (self.kind == other.kind)

224

450

return ((self.file_id == other.file_id)

451

and (self.name == other.name)

452

and (other.symlink_target == self.symlink_target)

453

and (self.text_sha1 == other.text_sha1)

454

and (self.text_size == other.text_size)

455

and (self.text_id == other.text_id)

456

and (self.parent_id == other.parent_id)

457

and (self.kind == other.kind)

458

and (self.revision == other.revision)

459

and (self.executable == other.executable)

460

)

225

461

226

462

def __ne__(self, other):
    """Return the negation of `self == other`."""
    equal = (self == other)
    return not equal

229

465

def __hash__(self):
    """Refuse hashing: always raises ValueError('not hashable')."""
    message = 'not hashable'
    raise ValueError(message)

231

467

468

def _unchanged(self, previous_ie):
    """Return True when this entry is unchanged relative to previous_ie.

    The base check only compares parent_id and name.  This method should
    be overridden in child classes.
    """
    # different inv parent
    if previous_ie.parent_id != self.parent_id:
        return False
    # renamed
    if previous_ie.name != self.name:
        return False
    return True

481

482

def _read_tree_state(self, path, work_tree):
    """Populate fields in the inventory entry from the given tree.

    There is nothing to do by default.

    Note that this should be modified to be a noop on virtual trees
    as all entries created there are prepopulated.
    """
    # TODO: Rather than running this manually, we should check the
    # working sha1 and other expensive properties when they're
    # first requested, or preload them if they're already known
    return None

492

493

def _forget_tree_state(self):
    """Do nothing; this base implementation holds no tree state to drop."""
    return None

232

495

233

496

234

497

class RootEntry(InventoryEntry):

498

499

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

500

'text_id', 'parent_id', 'children', 'executable',

501

'revision', 'symlink_target']

502

503

def _check(self, checker, rev_id, tree):

504

"""See InventoryEntry._check"""

505

235

506

def __init__(self, file_id):

236

507

self.file_id = file_id

237

508

self.children = {}

238

509

self.kind = 'root_directory'

239

510

self.parent_id = None

240

self.name = ''

511

self.name = u''

512

self.revision = None

241

513

242

514

def __eq__(self, other):

243

515

if not isinstance(other, RootEntry):

247

519

and (self.children == other.children)

248

520

249

521

250

251

class Inventory(XMLMixin):

522

class InventoryDirectory(InventoryEntry):

523

"""A directory in an inventory."""

524

525

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

526

'text_id', 'parent_id', 'children', 'executable',

527

'revision', 'symlink_target']

528

529

def _check(self, checker, rev_id, tree):

530

"""See InventoryEntry._check"""

531

if self.text_sha1 is not None or self.text_size is not None or self.text_id is not None:

532

raise BzrCheckError('directory {%s} has text in revision {%s}'

533

% (self.file_id, rev_id))

534

535

def copy(self):

536

other = InventoryDirectory(self.file_id, self.name, self.parent_id)

537

other.revision = self.revision

538

# note that children are *not* copied; they're pulled across when

539

# others are added

540

return other

541

542

def __init__(self, file_id, name, parent_id):

543

super(InventoryDirectory, self).__init__(file_id, name, parent_id)

544

self.children = {}

545

self.kind = 'directory'

546

547

def kind_character(self):

548

"""See InventoryEntry.kind_character."""

549

return '/'

550

551

def _put_in_tar(self, item, tree):

552

"""See InventoryEntry._put_in_tar."""

553

item.type = tarfile.DIRTYPE

554

fileobj = None

555

item.name += '/'

556

item.size = 0

557

item.mode = 0755

558

return fileobj

559

560

def _put_on_disk(self, fullpath, tree):

561

"""See InventoryEntry._put_on_disk."""

562

os.mkdir(fullpath)

563

564

def _snapshot_text(self, file_parents, work_tree, commit_builder):

565

"""See InventoryEntry._snapshot_text."""

566

commit_builder.modified_directory(self.file_id, file_parents)

567

568

569

class InventoryFile(InventoryEntry):

570

"""A file in an inventory."""

571

572

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

573

'text_id', 'parent_id', 'children', 'executable',

574

'revision', 'symlink_target']

575

576

def _check(self, checker, tree_revision_id, tree):

577

"""See InventoryEntry._check"""

578

t = (self.file_id, self.revision)

579

if t in checker.checked_texts:

580

prev_sha = checker.checked_texts[t]

581

if prev_sha != self.text_sha1:

582

raise BzrCheckError('mismatched sha1 on {%s} in {%s}' %

583

(self.file_id, tree_revision_id))

584

else:

585

checker.repeated_text_cnt += 1

586

return

587

588

if self.file_id not in checker.checked_weaves:

589

mutter('check weave {%s}', self.file_id)

590

w = tree.get_weave(self.file_id)

591

# Not passing a progress bar, because it creates a new

592

# progress, which overwrites the current progress,

593

# and doesn't look nice

594

w.check()

595

checker.checked_weaves[self.file_id] = True

596

else:

597

w = tree.get_weave(self.file_id)

598

599

mutter('check version {%s} of {%s}', tree_revision_id, self.file_id)

600

checker.checked_text_cnt += 1

601

# We can't check the length, because Weave doesn't store that

602

# information, and the whole point of looking at the weave's

603

# sha1sum is that we don't have to extract the text.

604

if self.text_sha1 != w.get_sha1(self.revision):

605

raise BzrCheckError('text {%s} version {%s} wrong sha1'

606

% (self.file_id, self.revision))

607

checker.checked_texts[t] = self.text_sha1

608

609

def copy(self):

610

other = InventoryFile(self.file_id, self.name, self.parent_id)

611

other.executable = self.executable

612

other.text_id = self.text_id

613

other.text_sha1 = self.text_sha1

614

other.text_size = self.text_size

615

other.revision = self.revision

616

return other

617

618

def detect_changes(self, old_entry):

619

"""See InventoryEntry.detect_changes."""

620

assert self.text_sha1 is not None

621

assert old_entry.text_sha1 is not None

622

text_modified = (self.text_sha1 != old_entry.text_sha1)

623

meta_modified = (self.executable != old_entry.executable)

624

return text_modified, meta_modified

625

626

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

627

output_to, reverse=False):

628

"""See InventoryEntry._diff."""

629

try:

630

from_text = tree.get_file(self.file_id).readlines()

631

if to_entry:

632

to_text = to_tree.get_file(to_entry.file_id).readlines()

633

else:

634

to_text = []

635

if not reverse:

636

text_diff(from_label, from_text,

637

to_label, to_text, output_to)

638

else:

639

text_diff(to_label, to_text,

640

from_label, from_text, output_to)

641

except BinaryFile:

642

if reverse:

643

label_pair = (to_label, from_label)

644

else:

645

label_pair = (from_label, to_label)

646

print >> output_to, "Binary files %s and %s differ" % label_pair

647

648

def has_text(self):

649

"""See InventoryEntry.has_text."""

650

return True

651

652

def __init__(self, file_id, name, parent_id):

653

super(InventoryFile, self).__init__(file_id, name, parent_id)

654

self.kind = 'file'

655

656

def kind_character(self):

657

"""See InventoryEntry.kind_character."""

658

return ''

659

660

def _put_in_tar(self, item, tree):

661

"""See InventoryEntry._put_in_tar."""

662

item.type = tarfile.REGTYPE

663

fileobj = tree.get_file(self.file_id)

664

item.size = self.text_size

665

if tree.is_executable(self.file_id):

666

item.mode = 0755

667

else:

668

item.mode = 0644

669

return fileobj

670

671

def _put_on_disk(self, fullpath, tree):

672

"""See InventoryEntry._put_on_disk."""

673

pumpfile(tree.get_file(self.file_id), file(fullpath, 'wb'))

674

if tree.is_executable(self.file_id):

675

os.chmod(fullpath, 0755)

676

677

def _read_tree_state(self, path, work_tree):

678

"""See InventoryEntry._read_tree_state."""

679

self.text_sha1 = work_tree.get_file_sha1(self.file_id, path=path)

680

# FIXME: 20050930 probe for the text size when getting sha1

681

# in _read_tree_state

682

self.executable = work_tree.is_executable(self.file_id, path=path)

683

684

def __repr__(self):

685

return ("%s(%r, %r, parent_id=%r, sha1=%r, len=%s)"

686

% (self.__class__.__name__,

687

self.file_id,

688

self.name,

689

self.parent_id,

690

self.text_sha1,

691

self.text_size))

692

693

def _forget_tree_state(self):

694

self.text_sha1 = None

695

self.executable = None

696

697

def _snapshot_text(self, file_parents, work_tree, commit_builder):

698

"""See InventoryEntry._snapshot_text."""

699

def get_content_byte_lines():

700

return work_tree.get_file(self.file_id).readlines()

701

self.text_sha1, self.text_size = commit_builder.modified_file_text(

702

self.file_id, file_parents, get_content_byte_lines, self.text_sha1, self.text_size)

703

704

def _unchanged(self, previous_ie):

705

"""See InventoryEntry._unchanged."""

706

compatible = super(InventoryFile, self)._unchanged(previous_ie)

707

if self.text_sha1 != previous_ie.text_sha1:

708

compatible = False

709

else:

710

# FIXME: 20050930 probe for the text size when getting sha1

711

# in _read_tree_state

712

self.text_size = previous_ie.text_size

713

if self.executable != previous_ie.executable:

714

compatible = False

715

return compatible

716

717

718

class InventoryLink(InventoryEntry):

719

"""A file in an inventory."""

720

721

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

722

'text_id', 'parent_id', 'children', 'executable',

723

'revision', 'symlink_target']

724

725

def _check(self, checker, rev_id, tree):

726

"""See InventoryEntry._check"""

727

if self.text_sha1 is not None or self.text_size is not None or self.text_id is not None:

728

raise BzrCheckError('symlink {%s} has text in revision {%s}'

729

% (self.file_id, rev_id))

730

if self.symlink_target is None:

731

raise BzrCheckError('symlink {%s} has no target in revision {%s}'

732

% (self.file_id, rev_id))

733

734

def copy(self):

735

other = InventoryLink(self.file_id, self.name, self.parent_id)

736

other.symlink_target = self.symlink_target

737

other.revision = self.revision

738

return other

739

740

def detect_changes(self, old_entry):

741

"""See InventoryEntry.detect_changes."""

742

# FIXME: which _modified field should we use ? RBC 20051003

743

text_modified = (self.symlink_target != old_entry.symlink_target)

744

if text_modified:

745

mutter(" symlink target changed")

746

meta_modified = False

747

return text_modified, meta_modified

748

749

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

750

output_to, reverse=False):

751

"""See InventoryEntry._diff."""

752

from_text = self.symlink_target

753

if to_entry is not None:

754

to_text = to_entry.symlink_target

755

if reverse:

756

temp = from_text

757

from_text = to_text

758

to_text = temp

759

print >>output_to, '=== target changed %r => %r' % (from_text, to_text)

760

else:

761

if not reverse:

762

print >>output_to, '=== target was %r' % self.symlink_target

763

else:

764

print >>output_to, '=== target is %r' % self.symlink_target

765

766

def __init__(self, file_id, name, parent_id):

767

super(InventoryLink, self).__init__(file_id, name, parent_id)

768

self.kind = 'symlink'

769

770

def kind_character(self):

771

"""See InventoryEntry.kind_character."""

772

return ''

773

774

def _put_in_tar(self, item, tree):

775

"""See InventoryEntry._put_in_tar."""

776

item.type = tarfile.SYMTYPE

777

fileobj = None

778

item.size = 0

779

item.mode = 0755

780

item.linkname = self.symlink_target

781

return fileobj

782

783

def _put_on_disk(self, fullpath, tree):

784

"""See InventoryEntry._put_on_disk."""

785

try:

786

os.symlink(self.symlink_target, fullpath)

787

except OSError,e:

788

raise BzrError("Failed to create symlink %r -> %r, error: %s" % (fullpath, self.symlink_target, e))

789

790

def _read_tree_state(self, path, work_tree):

791

"""See InventoryEntry._read_tree_state."""

792

self.symlink_target = work_tree.get_symlink_target(self.file_id)

793

794

def _forget_tree_state(self):

795

self.symlink_target = None

796

797

def _unchanged(self, previous_ie):

798

"""See InventoryEntry._unchanged."""

799

compatible = super(InventoryLink, self)._unchanged(previous_ie)

800

if self.symlink_target != previous_ie.symlink_target:

801

compatible = False

802

return compatible

803

804

def _snapshot_text(self, file_parents, work_tree, commit_builder):

805

"""See InventoryEntry._snapshot_text."""

806

commit_builder.modified_link(

807

self.file_id, file_parents, self.symlink_target)

808

809

810

class Inventory(object):

252

811

"""Inventory of versioned files in a tree.

253

812

254

813

This describes which file_id is present at each point in the tree,

266

825

inserted, other than through the Inventory API.

267

826

268

827

>>> inv = Inventory()

269

>>> inv.write_xml(sys.stdout)

270

271

</inventory>

272

>>> inv.add(InventoryEntry('123-123', 'hello.c', 'file', ROOT_ID))

828

>>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))

829

InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT', sha1=None, len=None)

273

830

>>> inv['123-123'].name

274

831

'hello.c'

275

832

283

840

May also look up by name:

284

841

285

842

>>> [x[0] for x in inv.iter_entries()]

286

['hello.c']

287

288

>>> inv.write_xml(sys.stdout)

289

290

291

</inventory>

292

843

[u'hello.c']

844

>>> inv = Inventory('TREE_ROOT-12345678-12345678')

845

>>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))

846

InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT-12345678-12345678', sha1=None, len=None)

293

847

"""

294

def __init__(self):

848

def __init__(self, root_id=ROOT_ID, revision_id=None):

295

849

"""Create or read an inventory.

296

850

297

851

If a working directory is specified, the inventory is read

301

855

The inventory is created with a default root directory, with

302

856

an id of None.

303

857

"""

304

self.root = RootEntry(ROOT_ID)

858

# We are letting Branch.create() create a unique inventory

859

# root id. Rather than generating a random one here.

860

#if root_id is None:

861

# root_id = bzrlib.branch.gen_file_id('TREE_ROOT')

862

self.root = RootEntry(root_id)

863

# FIXME: this isn't ever used, changing it to self.revision may break

864

# things. TODO make everything use self.revision_id

865

self.revision_id = revision_id

305

866

self._byid = {self.root.file_id: self.root}

306

867

868

def copy(self):
    """Return a new Inventory with the same root id and copied entries.

    Every entry yielded by iter_entries(), other than one equal to the
    root, is copied with its own copy() and added to the new inventory.
    """
    # TODO: jam 20051218 Should copy also copy the revision_id?
    duplicate = Inventory(self.root.file_id)
    # copy recursively so we know directories will be added before
    # their children.  There are more efficient ways than this...
    for _path, ie in self.iter_entries():
        if not (ie == self.root):
            duplicate.add(ie.copy())
    return duplicate

307

878

308

879

def __iter__(self):
    """Return an iterator over the keys of the _byid mapping."""
    by_id = self._byid
    return iter(by_id)

310

881

311

312

882

def __len__(self):
    """Returns number of entries."""
    by_id = self._byid
    return len(by_id)

315

885

316

317

886

def iter_entries(self, from_dir=None):

318

887

"""Return (path, entry) pairs, in order by name."""

319

if from_dir == None:

320

assert self.root

321

from_dir = self.root

322

elif isinstance(from_dir, basestring):

323

from_dir = self._byid[from_dir]

324

325

kids = from_dir.children.items()

326

kids.sort()

327

for name, ie in kids:

328

yield name, ie

329

if ie.kind == 'directory':

330

for cn, cie in self.iter_entries(from_dir=ie.file_id):

331

yield os.path.join(name, cn), cie

332

888

if from_dir is None:

889

assert self.root

890

from_dir = self.root

891

elif isinstance(from_dir, basestring):

892

from_dir = self._byid[from_dir]

893

894

# unrolling the recursive called changed the time from

895

# 440ms/663ms (inline/total) to 116ms/116ms

896

children = from_dir.children.items()

897

children.sort()

898

children = collections.deque(children)

899

stack = [(u'', children)]

900

while stack:

901

from_dir_relpath, children = stack[-1]

902

903

while children:

904

name, ie = children.popleft()

905

906

# we know that from_dir_relpath never ends in a slash

907

# and 'f' doesn't begin with one, we can do a string op, rather

908

# than the checks of pathjoin(), though this means that all paths

909

# start with a slash

910

path = from_dir_relpath + '/' + name

911

912

yield path[1:], ie

913

914

if ie.kind != 'directory':

915

continue

916

917

# But do this child first

918

new_children = ie.children.items()

919

new_children.sort()

920

new_children = collections.deque(new_children)

921

stack.append((path, new_children))

922

# Break out of inner loop, so that we start outer loop with child

923

break

924

else:

925

# if we finished all children, pop it off the stack

926

stack.pop()

927

928

def iter_entries_by_dir(self, from_dir=None):

929

"""Iterate over the entries in a directory first order.

930

931

This returns all entries for a directory before returning

932

the entries for children of a directory. This is not

933

lexicographically sorted order, and is a hybrid between

934

depth-first and breadth-first.

935

936

:return: This yields (path, entry) pairs

937

"""

938

# TODO? Perhaps this should return the from_dir so that the root is

939

# yielded? or maybe an option?

940

if from_dir is None:

941

assert self.root

942

from_dir = self.root

943

elif isinstance(from_dir, basestring):

944

from_dir = self._byid[from_dir]

945

946

stack = [(u'', from_dir)]

947

while stack:

948

cur_relpath, cur_dir = stack.pop()

949

950

child_dirs = []

951

for child_name, child_ie in sorted(cur_dir.children.iteritems()):

952

953

child_relpath = cur_relpath + child_name

954

955

yield child_relpath, child_ie

956

957

if child_ie.kind == 'directory':

958

child_dirs.append((child_relpath+'/', child_ie))

959

stack.extend(reversed(child_dirs))

333

960

334

961

def entries(self):

335

962

"""Return list of (path, ie) for all entries except the root.

341

968

kids = dir_ie.children.items()

342

969

kids.sort()

343

970

for name, ie in kids:

344

child_path = os.path.join(dir_path, name)

971

child_path = pathjoin(dir_path, name)

345

972

accum.append((child_path, ie))

346

973

if ie.kind == 'directory':

347

974

descend(ie, child_path)

348

975

349

descend(self.root, '')

976

descend(self.root, u'')

350

977

return accum

351

978

352

353

979

def directories(self):

354

980

"""Return (path, entry) pairs for all directories, including the root.

355

981

"""

361

987

kids.sort()

362

988

363

989

for name, child_ie in kids:

364

child_path = os.path.join(parent_path, name)

990

child_path = pathjoin(parent_path, name)

365

991

descend(child_ie, child_path)

366

descend(self.root, '')

992

descend(self.root, u'')

367

993

return accum

368

994

369

370

371

995

def __contains__(self, file_id):

372

996

"""True if this entry contains a file with given id.

373

997

374

998

>>> inv = Inventory()

375

>>> inv.add(InventoryEntry('123', 'foo.c', 'file', ROOT_ID))

999

>>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))

1000

InventoryFile('123', 'foo.c', parent_id='TREE_ROOT', sha1=None, len=None)

376

1001

>>> '123' in inv

377

1002

True

378

1003

>>> '456' in inv

380

1005

"""

381

1006

return file_id in self._byid

382

1007

383

384

1008

def __getitem__(self, file_id):

385

1009

"""Return the entry for given file_id.

386

1010

387

1011

>>> inv = Inventory()

388

>>> inv.add(InventoryEntry('123123', 'hello.c', 'file', ROOT_ID))

1012

>>> inv.add(InventoryFile('123123', 'hello.c', ROOT_ID))

1013

InventoryFile('123123', 'hello.c', parent_id='TREE_ROOT', sha1=None, len=None)

389

1014

>>> inv['123123'].name

390

1015

'hello.c'

391

1016

"""

392

1017

try:

393

1018

return self._byid[file_id]

394

1019

except KeyError:

395

if file_id == None:

1020

if file_id is None:

396

1021

raise BzrError("can't look up file_id None")

397

1022

else:

398

1023

raise BzrError("file_id {%s} not in inventory" % file_id)

399

1024

400

401

1025

def get_file_kind(self, file_id):
    """Return the `kind` attribute of the entry stored under file_id.

    The entry is fetched straight from _byid, so an id that is not
    present raises whatever that lookup raises.
    """
    entry = self._byid[file_id]
    return entry.kind

403

1027

404

1028

def get_child(self, parent_id, filename):
    """Return the child of parent_id called filename.

    The parent is looked up with self[parent_id]; the result is whatever
    its children mapping's get() gives for filename.
    """
    parent = self[parent_id]
    return parent.children.get(filename)

406

1030

407

408

1031

def add(self, entry):

409

1032

"""Add entry to inventory.

410

1033

411

1034

To add a file to a branch ready to be committed, use Branch.add,

412

which calls this."""

1035

which calls this.

1036

1037

Returns the new entry object.

1038

"""

413

1039

if entry.file_id in self._byid:

414

bailout("inventory already contains entry with id {%s}" % entry.file_id)

1040

raise BzrError("inventory already contains entry with id {%s}" % entry.file_id)

1041

1042

if entry.parent_id == ROOT_ID or entry.parent_id is None:

1043

entry.parent_id = self.root.file_id

415

1044

416

1045

try:

417

1046

parent = self._byid[entry.parent_id]

418

1047

except KeyError:

419

bailout("parent_id {%s} not in inventory" % entry.parent_id)

1048

raise BzrError("parent_id {%s} not in inventory" % entry.parent_id)

420

1049

421

if parent.children.has_key(entry.name):

422

bailout("%s is already versioned" %

423

appendpath(self.id2path(parent.file_id), entry.name))

1050

if entry.name in parent.children:

1051

raise BzrError("%s is already versioned" %

1052

pathjoin(self.id2path(parent.file_id), entry.name))

424

1053

425

1054

self._byid[entry.file_id] = entry

426

1055

parent.children[entry.name] = entry

427

428

429

def add_path(self, relpath, kind, file_id=None):

1056

return entry

1057

1058

def add_path(self, relpath, kind, file_id=None, parent_id=None):

430

1059

"""Add entry from a path.

431

1060

432

The immediate parent must already be versioned"""

1061

The immediate parent must already be versioned.

1062

1063

Returns the new entry object."""

1064

433

1065

parts = bzrlib.osutils.splitpath(relpath)

1066

434

1067

if len(parts) == 0:

435

bailout("cannot re-add root of inventory")

436

437

if file_id == None:

438

file_id = bzrlib.branch.gen_file_id(relpath)

439

440

parent_id = self.path2id(parts[:-1])

441

assert parent_id != None

442

ie = InventoryEntry(file_id, parts[-1],

443

kind=kind, parent_id=parent_id)

1068

if file_id is None:

1069

file_id = bzrlib.workingtree.gen_root_id()

1070

self.root = RootEntry(file_id)

1071

self._byid = {self.root.file_id: self.root}

1072

return

1073

else:

1074

parent_path = parts[:-1]

1075

parent_id = self.path2id(parent_path)

1076

if parent_id is None:

1077

raise NotVersionedError(path=parent_path)

1078

ie = make_entry(kind, parts[-1], parent_id, file_id)

444

1079

return self.add(ie)

445

1080

446

447

1081

def __delitem__(self, file_id):

448

1082

"""Remove entry by id.

449

1083

450

1084

>>> inv = Inventory()

451

>>> inv.add(InventoryEntry('123', 'foo.c', 'file', ROOT_ID))

1085

>>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))

1086

InventoryFile('123', 'foo.c', parent_id='TREE_ROOT', sha1=None, len=None)

452

1087

>>> '123' in inv

453

1088

True

454

1089

>>> del inv['123']

457

1092

"""

458

1093

ie = self[file_id]

459

1094

460

assert self[ie.parent_id].children[ie.name] == ie

1095

assert ie.parent_id is None or \

1096

self[ie.parent_id].children[ie.name] == ie

461

1097

462

# TODO: Test deleting all children; maybe hoist to a separate

463

# deltree method?

464

if ie.kind == 'directory':

465

for cie in ie.children.values():

466

del self[cie.file_id]

467

del ie.children

468

469

1098

del self._byid[file_id]

470

del self[ie.parent_id].children[ie.name]

471

472

473

def to_element(self):
    """Convert to XML Element

    Returns an 'inventory' element whose text is a newline and whose
    children are the to_element() results of every entry yielded by
    iter_entries(), in that order.
    """
    inventory_elt = Element('inventory')
    inventory_elt.text = '\n'
    for _path, entry in self.iter_entries():
        entry_elt = entry.to_element()
        inventory_elt.append(entry_elt)
    return inventory_elt

480

481

482

def from_element(cls, elt):
    """Construct from XML Element

    A new cls() is created and every child of elt is converted with
    InventoryEntry.from_element and added to it.

    >>> inv = Inventory()
    >>> inv.add(InventoryEntry('foo.c-123981239', 'foo.c', 'file', ROOT_ID))
    >>> elt = inv.to_element()
    >>> inv2 = Inventory.from_element(elt)
    >>> inv2 == inv
    True
    """
    assert elt.tag == 'inventory'
    inventory = cls()
    for child_elt in elt:
        entry = InventoryEntry.from_element(child_elt)
        inventory.add(entry)
    return inventory

from_element = classmethod(from_element)

499

1099

if ie.parent_id is not None:

1100

del self[ie.parent_id].children[ie.name]

500

1101

501

1102

def __eq__(self, other):

502

1103

"""Compare two sets by comparing their contents.

505

1106

>>> i2 = Inventory()

506

1107

>>> i1 == i2

507

1108

True

508

>>> i1.add(InventoryEntry('123', 'foo', 'file', ROOT_ID))

1109

>>> i1.add(InventoryFile('123', 'foo', ROOT_ID))

1110

InventoryFile('123', 'foo', parent_id='TREE_ROOT', sha1=None, len=None)

509

1111

>>> i1 == i2

510

1112

False

511

>>> i2.add(InventoryEntry('123', 'foo', 'file', ROOT_ID))

1113

>>> i2.add(InventoryFile('123', 'foo', ROOT_ID))

1114

InventoryFile('123', 'foo', parent_id='TREE_ROOT', sha1=None, len=None)

512

1115

>>> i1 == i2

513

1116

True

514

1117

"""

515

1118

if not isinstance(other, Inventory):

516

1119

return NotImplemented

517

1120

518

if len(self._byid) != len(other._byid):

519

# shortcut: obviously not the same

520

return False

521

522

1121

return self._byid == other._byid

523

1122

524

525

1123

def __ne__(self, other):

526

return not (self == other)

527

1124

return not self.__eq__(other)

528

1125

529

1126

def __hash__(self):
    """Refuse hashing: always raises ValueError('not hashable')."""
    message = 'not hashable'
    raise ValueError(message)

531

1128

532

1129

def _iter_file_id_parents(self, file_id):
    """Yield the entry for file_id, then each parent entry in turn.

    The walk follows parent_id links and stops once a parent_id of None
    is reached.  Nothing is yielded when file_id itself is None.

    :raises BzrError: if an id on the chain is not in _byid.
    """
    current_id = file_id
    while current_id is not None:
        try:
            entry = self._byid[current_id]
        except KeyError:
            raise BzrError("file_id {%s} not found in inventory" % current_id)
        yield entry
        current_id = entry.parent_id

533

1138

534

1139

def get_idpath(self, file_id):

535

1140

"""Return a list of file_ids for the path to an entry.

540

1145

root directory as depth 1.

541

1146

"""

542

1147

p = []

543

while file_id != None:

544

try:

545

ie = self._byid[file_id]

546

except KeyError:

547

bailout("file_id {%s} not found in inventory" % file_id)

548

p.insert(0, ie.file_id)

549

file_id = ie.parent_id

1148

for parent in self._iter_file_id_parents(file_id):

1149

p.insert(0, parent.file_id)

550

1150

return p

551

1151

552

553

1152

def id2path(self, file_id):

554

"""Return as a list the path to file_id."""

555

1153

"""Return as a string the path to file_id.

1154

1155

>>> i = Inventory()

1156

>>> e = i.add(InventoryDirectory('src-id', 'src', ROOT_ID))

1157

>>> e = i.add(InventoryFile('foo-id', 'foo.c', parent_id='src-id'))

1158

>>> print i.id2path('foo-id')

1159

src/foo.c

1160

"""

556

1161

# get all names, skipping root

557

p = [self[fid].name for fid in self.get_idpath(file_id)[1:]]

558

return os.sep.join(p)

1162

return '/'.join(reversed(

1163

[parent.name for parent in

1164

self._iter_file_id_parents(file_id)][:-1]))

559

1165

560

561

562

1166

def path2id(self, name):

563

1167

"""Walk down through directories to return entry of last component.

564

1168

568

1172

This returns the entry of the last component in the path,

569

1173

which may be either a file or a directory.

570

1174

571

Returns None iff the path is not found.

1175

Returns None IFF the path is not found.

572

1176

"""

573

1177

if isinstance(name, types.StringTypes):

574

1178

name = splitpath(name)

575

1179

576

mutter("lookup path %r" % name)

1180

# mutter("lookup path %r" % name)

577

1181

578

1182

parent = self.root

579

1183

for f in name:

588

1192

589

1193

return parent.file_id

590

1194

591

592

1195

def has_filename(self, names):
    """Return True if path2id() finds an entry for the given path.

    :param names: the path to look up; it is passed to path2id()
        unchanged, so whatever forms path2id() accepts are accepted here.
    :return: True when path2id() returns a true value, False otherwise
        (including when it returns None for a path that is not found).
    """
    return bool(self.path2id(names))

594

1197

595

596

1198

def has_id(self, file_id):
    """Return True if file_id is present in this inventory.

    :param file_id: the file id to look for in the by-id index.
    :return: True if ``self._byid`` has an entry for file_id, else False.
    """
    # ``in`` performs the same lookup as dict.has_key(), which is
    # deprecated and no longer exists on newer interpreters.
    return file_id in self._byid

598

1200

599

600

1201

def rename(self, file_id, new_parent_id, new_name):

601

1202

"""Move a file within the inventory.

602

1203

604

1205

605

1206

This does not move the working file."""

606

1207

if not is_valid_name(new_name):

607

bailout("not an acceptable filename: %r" % new_name)

1208

raise BzrError("not an acceptable filename: %r" % new_name)

608

1209

609

1210

new_parent = self._byid[new_parent_id]

610

1211

if new_name in new_parent.children:

611

bailout("%r already exists in %r" % (new_name, self.id2path(new_parent_id)))

1212

raise BzrError("%r already exists in %r" % (new_name, self.id2path(new_parent_id)))

612

1213

613

1214

new_parent_idpath = self.get_idpath(new_parent_id)

614

1215

if file_id in new_parent_idpath:

615

bailout("cannot move directory %r into a subdirectory of itself, %r"

1216

raise BzrError("cannot move directory %r into a subdirectory of itself, %r"

616

1217

% (self.id2path(file_id), self.id2path(new_parent_id)))

617

1218

618

1219

file_ie = self._byid[file_id]

627

1228

file_ie.parent_id = new_parent_id

628

1229

629

1230

630

631

632

_NAME_RE = re.compile(r'^[^/\\]+$')

1231

def make_entry(kind, name, parent_id, file_id=None):
    """Create an inventory entry.

    :param kind: the type of inventory entry to create; one of
        'directory', 'file' or 'symlink'.
    :param name: the basename of the entry.
    :param parent_id: the parent_id of the entry.
    :param file_id: the file_id to use. if None, one will be created.
    :return: an InventoryDirectory, InventoryFile or InventoryLink,
        according to kind.
    :raises BzrError: if kind is not one of the three known kinds.
    """
    if file_id is None:
        # No id supplied: derive a fresh one from the entry's name.
        file_id = bzrlib.workingtree.gen_file_id(name)
    if kind == 'directory':
        return InventoryDirectory(file_id, name, parent_id)
    elif kind == 'file':
        return InventoryFile(file_id, name, parent_id)
    elif kind == 'symlink':
        return InventoryLink(file_id, name, parent_id)
    else:
        raise BzrError("unknown kind %r" % kind)

1249

1250

1251

1252

# Pattern used by is_valid_name(); left as None until the first call, which
# compiles it (presumably to keep regex compilation out of module import).
_NAME_RE = None


def is_valid_name(name):
    """Return True if name is acceptable as an inventory entry name.

    A name is accepted when it is non-empty and contains neither a forward
    slash nor a backslash.

    :param name: the candidate entry name (a string).
    :return: True if the name is acceptable, False otherwise.
    """
    global _NAME_RE
    if _NAME_RE is None:
        # First use: compile once and cache at module level.
        _NAME_RE = re.compile(r'^[^/\\]+$')

    return bool(_NAME_RE.match(name))

Older »