~bzr-pqm/bzr/bzr.dev


Viewing changes to bzrlib/groupcompress.py

  • Committer: John Arbash Meinel
  • Date: 2009-06-17 17:57:15 UTC
  • mfrom: (4454 +trunk)
  • mto: This revision was merged to the branch mainline in revision 4460.
  • Revision ID: john@arbash-meinel.com-20090617175715-p9ebpwx5rhc0qin1
Merge bzr.dev 4454 in preparation for NEWS entry.


@@ -324,7 +324,11 @@
                 raise ValueError('invalid content_len %d for record @ pos %d'
                                  % (content_len, pos - len_len - 1))
             if kind == 'f': # Fulltext
-                result.append(('f', content_len))
+                if include_text:
+                    text = self._content[pos:pos+content_len]
+                    result.append(('f', content_len, text))
+                else:
+                    result.append(('f', content_len))
             elif kind == 'd': # Delta
                 delta_content = self._content[pos:pos+content_len]
                 delta_info = []
@@ -339,7 +343,11 @@
                         (offset, length,
                          delta_pos) = decode_copy_instruction(delta_content, c,
                                                               delta_pos)
-                        delta_info.append(('c', offset, length))
+                        if include_text:
+                            text = self._content[offset:offset+length]
+                            delta_info.append(('c', offset, length, text))
+                        else:
+                            delta_info.append(('c', offset, length))
                         measured_len += length
                     else: # Insert
                         if include_text:
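The new include_text flag only changes the shape of the tuples this dump
helper yields, for both the fulltext and the copy-instruction cases. A
minimal plain-Python sketch of the two shapes, using made-up data rather
than bzrlib code:

    # Stand-ins for self._content and one decoded fulltext record.
    content = 'hello world'
    pos, content_len = 0, 5
    for include_text in (False, True):
        result = []
        if include_text:
            text = content[pos:pos + content_len]
            result.append(('f', content_len, text))
        else:
            result.append(('f', content_len))
        print result
    # [('f', 5)]
    # [('f', 5, 'hello')]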
@@ -746,6 +754,14 @@
 
         After calling this, the compressor should no longer be used
         """
+        # TODO: this causes us to 'bloat' to 2x the size of content in the
+        #       group. This has an impact for 'commit' of large objects.
+        #       One possibility is to use self._content_chunks, and be lazy and
+        #       only fill out self._content as a full string when we actually
+        #       need it. That would at least drop the peak memory consumption
+        #       for 'commit' down to ~1x the size of the largest file, at a
+        #       cost of increased complexity within this code. 2x is still <<
+        #       3x the size of the largest file, so we are doing ok.
         content = ''.join(self.chunks)
         self.chunks = None
         self._delta_index = None
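A rough sketch of what the TODO above describes (hypothetical class, not
bzrlib code): ''.join() keeps the chunk list and the joined copy alive at
its peak, and the suggested fix is to hold the chunks and join on demand:

    # Eager join: while ''.join(chunks) runs, the chunk list and the new
    # joined string are both alive, so peak memory is ~2x the content.
    chunks = ['x' * 1024] * 1024
    content = ''.join(chunks)
    chunks = None

    # Lazy alternative sketched in the TODO: keep the chunks and only
    # build the full string when a caller actually needs it.
    class LazyContent(object):
        def __init__(self, chunks):
            self._content_chunks = chunks
            self._content = None
        def content(self):
            if self._content is None:
                self._content = ''.join(self._content_chunks)
                self._content_chunks = None
            return self._content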
@@ -1006,23 +1022,15 @@
         if not parent_map:
             raise errors.RevisionNotPresent(key, self)
         if parent_map[key] is not None:
-            search = graph._make_breadth_first_searcher([key])
-            keys = set()
-            while True:
-                try:
-                    present, ghosts = search.next_with_ghosts()
-                except StopIteration:
-                    break
-                keys.update(present)
-            parent_map = self.get_parent_map(keys)
+            parent_map = dict((k, v) for k, v in graph.iter_ancestry([key])
+                              if v is not None)
+            keys = parent_map.keys()
         else:
             keys = [key]
             parent_map = {key:()}
-        # So we used Graph(self) to load the parent_map, but now that we have
-        # it, we can just query the parent map directly, so create a new Graph
-        # object
-        graph = _mod_graph.Graph(_mod_graph.DictParentsProvider(parent_map))
-        head_cache = _mod_graph.FrozenHeadsCache(graph)
+        # We used Graph(self) to load the parent_map, but now that we have it,
+        # we can just query the parent map directly, so create a KnownGraph
+        heads_provider = _mod_graph.KnownGraph(parent_map)
         parent_cache = {}
         reannotate = annotate.reannotate
         for record in self.get_record_stream(keys, 'topological', True):
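The hand-rolled breadth-first search above is replaced by a single
iter_ancestry() call; ghosts come back with None for their parents, which
the generator expression filters out. A plain-Python stand-in for that
contract (hypothetical helper, not the bzrlib implementation):

    # Stand-in for graph.iter_ancestry([key]): yields (key, parents),
    # where parents is None for a ghost (named as a parent, but absent).
    def iter_ancestry(parents_by_key, keys):
        seen = set()
        pending = set(keys)
        while pending:
            key = pending.pop()
            if key in seen:
                continue
            seen.add(key)
            parents = parents_by_key.get(key)   # None -> ghost
            yield key, parents
            if parents:
                pending.update(parents)

    ancestry = {'B': ('A',), 'A': ('ghost',)}
    parent_map = dict((k, v) for k, v in iter_ancestry(ancestry, ['B'])
                      if v is not None)
    # parent_map == {'B': ('A',), 'A': ('ghost',)}; the ghost itself
    # yielded ('ghost', None) and was dropped by the filter.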
@@ -1030,7 +1038,7 @@
             lines = osutils.chunks_to_lines(record.get_bytes_as('chunked'))
             parent_lines = [parent_cache[parent] for parent in parent_map[key]]
             parent_cache[key] = list(
-                reannotate(parent_lines, lines, key, None, head_cache))
+                reannotate(parent_lines, lines, key, None, heads_provider))
         return parent_cache[key]
 
     def check(self, progress_bar=None):
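Both the old FrozenHeadsCache and the new KnownGraph act as the heads
provider that reannotate() consults when two revisions both claim a line;
KnownGraph is simply built straight from the plain parent_map dict. A
small sketch of the heads() question it answers, assuming bzrlib is
importable as in this file:

    from bzrlib import graph as _mod_graph

    # rev-2 descends from rev-1, so only rev-2 is a head of the pair.
    parent_map = {('rev-1',): (), ('rev-2',): (('rev-1',),)}
    heads_provider = _mod_graph.KnownGraph(parent_map)
    print heads_provider.heads([('rev-1',), ('rev-2',)])
    # expected: frozenset([('rev-2',)])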