~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/inventory.py

Committer: Andrew Bennetts
Date: 2007-10-05 05:52:45 UTC
mfrom: (2890 +trunk)
mto: (2535.4.11 streaming-smart-fetch)
mto: This revision was merged to the branch mainline in revision 2906.
Revision ID: andrew.bennetts@canonical.com-20071005055245-5f8ldcqxp21zy8v8

Merge from bzr.dev.

files added:
bzrlib/_patiencediff_c.c

bzrlib/benchmarks/bench_pack.py

bzrlib/patiencediff.py

bzrlib/reconfigure.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/transport/trace.py

doc/developers/authentication-ring.txt

files renamed:
bzrlib/patiencediff.py => bzrlib/_patiencediff_py.py

files modified:
.bzrignore

Makefile

NEWS

bzrlib/__init__.py

bzrlib/annotate.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/debug.py

bzrlib/dirstate.py

bzrlib/errors.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/help_topics.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisiontree.py

bzrlib/store/revision/knit.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/tests/HttpServer.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_config.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_info.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tuned_gzip.py

bzrlib/version.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml_serializer.py

doc/developers/HACKING.txt

doc/en/user-guide/configuration.txt

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/inventory.py

BzrCheckError,

BzrError,

)

from bzrlib.symbol_versioning import deprecated_method, zero_ninetyone

from bzrlib.trace import mutter

161

162

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

162

163

output_to, reverse=False):

163

164

"""Perform a diff between two entries of the same kind."""

164

165

def find_previous_heads(self, previous_inventories,

166

versioned_file_store,

167

transaction,

168

entry_vf=None):

169

"""Return the revisions and entries that directly precede this.

170

171

Returned as a map from revision to inventory entry.

172

173

This is a map containing the file revisions in all parents

174

for which the file exists, and its revision is not a parent of

175

any other. If the file is new, the set will be empty.

176

177

:param versioned_file_store: A store where ancestry data on this

178

file id can be queried.

179

:param transaction: The transaction that queries to the versioned

180

file store should be completed under.

181

:param entry_vf: The entry versioned file, if its already available.

165

166

def parent_candidates(self, previous_inventories):

167

"""Find possible per-file graph parents.

168

169

This is currently defined by:

170

- Select the last changed revision in the parent inventory.

171

- Do deal with a short lived bug in bzr 0.8's development two entries

172

that have the same last changed but different 'x' bit settings are

173

changed in-place.

182

174

"""

183

def get_ancestors(weave, entry):

184

return set(weave.get_ancestry(entry.revision, topo_sorted=False))

185

175

# revision:ie mapping for each ie found in previous_inventories.

186

176

candidates = {}

187

# revision:ie mapping with one revision for each head.

188

heads = {}

189

# revision: ancestor list for each head

190

head_ancestors = {}

191

177

# identify candidate head revision ids.

192

178

for inv in previous_inventories:

193

179

if self.file_id in inv:

194

180

ie = inv[self.file_id]

195

181

assert ie.file_id == self.file_id

196

if ie.kind != self.kind:

197

# Can't be a candidate if the kind has changed.

198

continue

199

182

if ie.revision in candidates:

200

183

# same revision value in two different inventories:

201

184

# correct possible inconsistencies:

212

195

else:

213

196

# add this revision as a candidate.

214

197

candidates[ie.revision] = ie

215

198

return candidates

199

200

@deprecated_method(zero_ninetyone)

201

def find_previous_heads(self, previous_inventories,

202

versioned_file_store,

203

transaction,

204

entry_vf=None):

205

"""Return the revisions and entries that directly precede this.

206

207

Returned as a map from revision to inventory entry.

208

209

This is a map containing the file revisions in all parents

210

for which the file exists, and its revision is not a parent of

211

any other. If the file is new, the set will be empty.

212

213

:param versioned_file_store: A store where ancestry data on this

214

file id can be queried.

215

:param transaction: The transaction that queries to the versioned

216

file store should be completed under.

217

:param entry_vf: The entry versioned file, if its already available.

218

"""

219

candidates = self.parent_candidates(previous_inventories)

220

221

# revision:ie mapping with one revision for each head.

222

heads = {}

216

223

# common case optimisation

217

224

if len(candidates) == 1:

218

225

# if there is only one candidate revision found

219

# then we can opening the versioned file to access ancestry:

226

# then we can avoid opening the versioned file to access ancestry:

220

227

# there cannot be any ancestors to eliminate when there is

221

228

# only one revision available.

222

heads[ie.revision] = ie

223

return heads

229

return candidates

230

231

# --- what follows is now encapsulated in repository.get_graph.heads(),

232

# but that is not accessible from here as we have no repository

233

# pointer. Note that the repository.get_graph.heads() call can return

234

# different results *at the moment* because of the kind-changing check

235

# we have in parent_candidates().

224

236

225

237

# eliminate ancestors amongst the available candidates:

226

238

# heads are those that are not an ancestor of any other candidate

227

239

# - this provides convergence at a per-file level.

240

def get_ancestors(weave, entry):

241

return set(weave.get_ancestry(entry.revision, topo_sorted=False))

242

# revision: ancestor list for each head

243

head_ancestors = {}

228

244

for ie in candidates.values():

229

245

# may be an ancestor of a known head:

230

246

already_present = 0 != len(

416

432

self.parent_id,

417

433

self.revision))

418

434

419

def snapshot(self, revision, path, previous_entries,

420

work_tree, commit_builder):

421

"""Make a snapshot of this entry which may or may not have changed.

422

423

This means that all its fields are populated, that it has its

424

text stored in the text store or weave.

425

426

:return: True if anything was recorded

427

"""

428

# cannot be unchanged unless there is only one parent file rev.

429

self._read_tree_state(path, work_tree)

430

if len(previous_entries) == 1:

431

parent_ie = previous_entries.values()[0]

432

if self._unchanged(parent_ie):

433

self.revision = parent_ie.revision

434

return False

435

self.revision = revision

436

return self._snapshot_text(previous_entries, work_tree, commit_builder)

437

438

def _snapshot_text(self, file_parents, work_tree, commit_builder):

439

"""Record the 'text' of this entry, whatever form that takes.

440

441

:return: True if anything was recorded

442

"""

443

raise NotImplementedError(self._snapshot_text)

444

445

435

def __eq__(self, other):

446

436

if not isinstance(other, InventoryEntry):

447

437

return NotImplemented

566

556

"""See InventoryEntry._put_on_disk."""

567

557

os.mkdir(fullpath)

568

558

569

def _snapshot_text(self, file_parents, work_tree, commit_builder):

570

"""See InventoryEntry._snapshot_text."""

571

commit_builder.modified_directory(self.file_id, file_parents)

572

return True

573

574

559

575

560

class InventoryFile(InventoryEntry):

576

561

"""A file in an inventory."""

700

685

def _forget_tree_state(self):

701

686

self.text_sha1 = None

702

687

703

def snapshot(self, revision, path, previous_entries,

704

work_tree, commit_builder):

705

"""See InventoryEntry.snapshot."""

706

# Note: We use a custom implementation of this method for files

707

# because it's a performance critical part of commit.

708

709

# If this is the initial commit for this file, we know the sha is

710

# coming later so skip calculating it now (in _read_tree_state())

711

if len(previous_entries) == 0:

712

self.executable = work_tree.is_executable(self.file_id, path=path)

713

else:

714

self._read_tree_state(path, work_tree)

715

716

# If nothing is changed from the sole parent, there's nothing to do

717

if len(previous_entries) == 1:

718

parent_ie = previous_entries.values()[0]

719

if self._unchanged(parent_ie):

720

self.revision = parent_ie.revision

721

return False

722

723

# Add the file to the repository

724

self.revision = revision

725

def get_content_byte_lines():

726

return work_tree.get_file(self.file_id, path).readlines()

727

self.text_sha1, self.text_size = commit_builder.modified_file_text(

728

self.file_id, previous_entries, get_content_byte_lines,

729

self.text_sha1, self.text_size)

730

return True

731

732

688

def _unchanged(self, previous_ie):

733

689

"""See InventoryEntry._unchanged."""

734

690

compatible = super(InventoryFile, self)._unchanged(previous_ie)

829

785

compatible = False

830

786

return compatible

831

787

832

def _snapshot_text(self, file_parents, work_tree, commit_builder):

833

"""See InventoryEntry._snapshot_text."""

834

commit_builder.modified_link(

835

self.file_id, file_parents, self.symlink_target)

836

return True

837

838

788

839

789

class TreeReference(InventoryEntry):

840

790

850

800

return TreeReference(self.file_id, self.name, self.parent_id,

851

801

self.revision, self.reference_revision)

852

802

853

def _snapshot_text(self, file_parents, work_tree, commit_builder):

854

commit_builder.modified_reference(self.file_id, file_parents)

855

return True

856

857

803

def _read_tree_state(self, path, work_tree):

858

804

"""Populate fields in the inventory entry from the given tree.

859

805

"""

863

809

def _forget_tree_state(self):

864

810

self.reference_revision = None

865

811

812

def _unchanged(self, previous_ie):

813

"""See InventoryEntry._unchanged."""

814

compatible = super(TreeReference, self)._unchanged(previous_ie)

815

if self.reference_revision != previous_ie.reference_revision:

816

compatible = False

817

return compatible

818

866

819

867

820

class Inventory(object):

868

821

"""Inventory of versioned files in a tree.

923

876

self._byid = {}

924

877

self.revision_id = revision_id

925

878

879

def __repr__(self):

880

return "<Inventory object at %x, contents=%r>" % (id(self), self._byid)

881

882

def apply_delta(self, delta):

883

"""Apply a delta to this inventory.

884

885

:param delta: A list of changes to apply. After all the changes are

886

applied the final inventory must be internally consistent, but it

887

is ok to supply changes which, if only half-applied would have an

888

invalid result - such as supplying two changes which rename two

889

files, 'A' and 'B' with each other : [('A', 'B', 'A-id', a_entry),

890

('B', 'A', 'B-id', b_entry)].

891

892

Each change is a tuple, of the form (old_path, new_path, file_id,

893

new_entry).

894

895

When new_path is None, the change indicates the removal of an entry

896

from the inventory and new_entry will be ignored (using None is

897

appropriate). If new_path is not None, then new_entry must be an

898

InventoryEntry instance, which will be incorporated into the

899

inventory (and replace any existing entry with the same file id).

900

901

When old_path is None, the change indicates the addition of

902

a new entry to the inventory.

903

904

When neither new_path nor old_path are None, the change is a

905

modification to an entry, such as a rename, reparent, kind change

906

etc.

907

908

The children attribute of new_entry is ignored. This is because

909

this method preserves children automatically across alterations to

910

the parent of the children, and cases where the parent id of a

911

child is changing require the child to be passed in as a separate

912

change regardless. E.g. in the recursive deletion of a directory -

913

the directory's children must be included in the delta, or the

914

final inventory will be invalid.

915

"""

916

children = {}

917

# Remove all affected items which were in the original inventory,

918

# starting with the longest paths, thus ensuring parents are examined

919

# after their children, which means that everything we examine has no

920

# modified children remaining by the time we examine it.

921

for old_path, file_id in sorted(((op, f) for op, np, f, e in delta

922

if op is not None), reverse=True):

923

if file_id not in self:

924

# adds come later

925

continue

926

# Preserve unaltered children of file_id for later reinsertion.

927

children[file_id] = getattr(self[file_id], 'children', {})

928

# Remove file_id and the unaltered children. If file_id is not

929

# being deleted it will be reinserted back later.

930

self.remove_recursive_id(file_id)

931

# Insert all affected which should be in the new inventory, reattaching

932

# their children if they had any. This is done from shortest path to

933

# longest, ensuring that items which were modified and whose parents in

934

# the resulting inventory were also modified, are inserted after their

935

# parents.

936

for new_path, new_entry in sorted((np, e) for op, np, f, e in

937

delta if np is not None):

938

if new_entry.kind == 'directory':

939

new_entry.children = children.get(new_entry.file_id, {})

940

self.add(new_entry)

941

926

942

def _set_root(self, ie):

927

943

self.root = ie

928

944

self._byid = {self.root.file_id: self.root}

988

1004

# if we finished all children, pop it off the stack

989

1005

stack.pop()

990

1006

991

def iter_entries_by_dir(self, from_dir=None, specific_file_ids=None):

1007

def iter_entries_by_dir(self, from_dir=None, specific_file_ids=None,

1008

yield_parents=False):

992

1009

"""Iterate over the entries in a directory first order.

993

1010

994

1011

This returns all entries for a directory before returning

996

1013

lexicographically sorted order, and is a hybrid between

997

1014

depth-first and breadth-first.

998

1015

1016

:param yield_parents: If True, yield the parents from the root leading

1017

down to specific_file_ids that have been requested. This has no

1018

impact if specific_file_ids is None.

999

1019

:return: This yields (path, entry) pairs

1000

1020

"""

1001

1021

if specific_file_ids:

1007

1027

if self.root is None:

1008

1028

return

1009

1029

# Optimize a common case

1010

if specific_file_ids is not None and len(specific_file_ids) == 1:

1030

if (not yield_parents and specific_file_ids is not None and

1031

len(specific_file_ids) == 1):

1011

1032

file_id = list(specific_file_ids)[0]

1012

1033

if file_id in self:

1013

1034

yield self.id2path(file_id), self[file_id]

1014

1035

return

1015

1036

from_dir = self.root

1016

if (specific_file_ids is None or

1037

if (specific_file_ids is None or yield_parents or

1017

1038

self.root.file_id in specific_file_ids):

1018

1039

yield u'', self.root

1019

1040

elif isinstance(from_dir, basestring):

1048

1069

child_relpath = cur_relpath + child_name

1049

1070

1050

1071

if (specific_file_ids is None or

1051

child_ie.file_id in specific_file_ids):

1072

child_ie.file_id in specific_file_ids or

1073

(yield_parents and child_ie.file_id in parents)):

1052

1074

yield child_relpath, child_ie

1053

1075

1054

1076

if child_ie.kind == 'directory':

1355

1377

This does not move the working file.

1356

1378

"""

1357

1379

file_id = osutils.safe_file_id(file_id)

1380

new_name = ensure_normalized_name(new_name)

1358

1381

if not is_valid_name(new_name):

1359

1382

raise BzrError("not an acceptable filename: %r" % new_name)

1360

1383

1402

1425

file_id = generate_ids.gen_file_id(name)

1403

1426

else:

1404

1427

file_id = osutils.safe_file_id(file_id)

1405

1428

name = ensure_normalized_name(name)

1429

try:

1430

factory = entry_factory[kind]

1431

except KeyError:

1432

raise BzrError("unknown kind %r" % kind)

1433

return factory(file_id, name, parent_id)

1434

1435

1436

def ensure_normalized_name(name):

1437

"""Normalize name.

1438

1439

:raises InvalidNormalization: When name is not normalized, and cannot be

1440

accessed on this platform by the normalized path.

1441

:return: The NFC/NFKC normalised version of name.

1442

"""

1406

1443

#------- This has been copied to bzrlib.dirstate.DirState.add, please

1407

1444

# keep them synchronised.

1408

1445

# we dont import normalized_filename directly because we want to be

1410

1447

norm_name, can_access = osutils.normalized_filename(name)

1411

1448

if norm_name != name:

1412

1449

if can_access:

1413

name = norm_name

1450

return norm_name

1414

1451

else:

1415

1452

# TODO: jam 20060701 This would probably be more useful

1416

1453

# if the error was raised with the full path

1417

1454

raise errors.InvalidNormalization(name)

1418

1419

try:

1420

factory = entry_factory[kind]

1421

except KeyError:

1422

raise BzrError("unknown kind %r" % kind)

1423

return factory(file_id, name, parent_id)

1455

return name

1424

1456

1425

1457

1426

1458

_NAME_RE = None

Older »