1080
by Martin Pool
- test tool for converting history to weave files |
1 |
#! /usr/bin/python
|
1267
by Martin Pool
- notes on conversion of existing history to weaves |
2 |
#
|
1080
by Martin Pool
- test tool for converting history to weave files |
3 |
# Copyright (C) 2005 Canonical Ltd
|
1267
by Martin Pool
- notes on conversion of existing history to weaves |
4 |
#
|
1080
by Martin Pool
- test tool for converting history to weave files |
5 |
# This program is free software; you can redistribute it and/or modify
|
6 |
# it under the terms of the GNU General Public License as published by
|
|
7 |
# the Free Software Foundation; either version 2 of the License, or
|
|
8 |
# (at your option) any later version.
|
|
1267
by Martin Pool
- notes on conversion of existing history to weaves |
9 |
#
|
1080
by Martin Pool
- test tool for converting history to weave files |
10 |
# This program is distributed in the hope that it will be useful,
|
11 |
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
12 |
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
13 |
# GNU General Public License for more details.
|
|
1267
by Martin Pool
- notes on conversion of existing history to weaves |
14 |
#
|
1080
by Martin Pool
- test tool for converting history to weave files |
15 |
# You should have received a copy of the GNU General Public License
|
16 |
# along with this program; if not, write to the Free Software
|
|
17 |
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
18 |
||
19 |
"""Experiment in converting existing bzr branches to weaves."""
|
|
20 |
||
1267
by Martin Pool
- notes on conversion of existing history to weaves |
21 |
# To make this properly useful
|
22 |
#
|
|
23 |
# 1. assign text version ids, and put those text versions into
|
|
24 |
# the inventory as they're converted.
|
|
25 |
#
|
|
26 |
# 2. keep track of the previous version of each file, rather than
|
|
27 |
# just using the last one imported
|
|
28 |
#
|
|
29 |
# 3. assign entry versions when files are added, renamed or moved.
|
|
30 |
#
|
|
31 |
# 4. when merged-in versions are observed, walk down through them
|
|
32 |
# to discover everything, then commit bottom-up
|
|
33 |
#
|
|
34 |
# 5. track ancestry as things are merged in, and commit that in each
|
|
35 |
# revision
|
|
36 |
#
|
|
37 |
# Perhaps it's best to first walk the whole graph and make a plan for
|
|
38 |
# what should be imported in what order? Need a kind of topological
|
|
39 |
# sort of all revisions. (Or do we, can we just before doing a revision
|
|
40 |
# see that all its parents have either been converted or abandoned?)
|
|
41 |
||
1315
by Martin Pool
- import file inventories in correct order |
42 |
|
43 |
# Cannot import a revision until all its parents have been
|
|
44 |
# imported.  In other words, we can only import revisions whose
|
|
45 |
# parents have all been imported.  The first step must be to
|
|
46 |
# import a revision with no parents, of which there must be at
|
|
47 |
# least one. (So perhaps it's useful to store forward pointers
|
|
48 |
# from a list of parents to their children?)
|
|
49 |
#
|
|
50 |
# Another (equivalent?) approach is to build up the ordered
|
|
51 |
# ancestry list for the last revision, and walk through that. We
|
|
52 |
# are going to need that.
|
|
53 |
#
|
|
54 |
# We don't want to have to recurse all the way back down the list.
|
|
55 |
#
|
|
56 |
# Suppose we keep a queue of the revisions able to be processed at
|
|
57 |
# any point. This starts out with all the revisions having no
|
|
58 |
# parents.
|
|
59 |
#
|
|
60 |
# This seems like a generally useful algorithm...
|
|
61 |
#
|
|
62 |
# The current algorithm is dumb (O(n**2)?) but will do the job, and
|
|
63 |
# takes less than a second on the bzr.dev branch.
|
|
64 |
||
1318
by Martin Pool
- pull texts into weaves in a fairly lazy way |
65 |
# This currently does a kind of lazy conversion of file texts, where a
|
66 |
# new text is written in every version. That's unnecessary but for
|
|
67 |
# the moment saves us having to worry about when files need new
|
|
68 |
# versions.
|
|
69 |
||
70 |
||
1350
by Martin Pool
- set reasonable name_versions |
71 |
# Optional psyco start-up, switched off by the constant-false guard below.
# When enabled, a missing psyco module is ignored rather than treated as an
# error.
if False:
    try:
        import psyco
        psyco.full()
    except ImportError:
        pass
|
|
1083
by Martin Pool
- add space to store revision-id in weave files |
77 |
|
1080
by Martin Pool
- test tool for converting history to weave files |
78 |
|
1352
by Martin Pool
- store control weaves in .bzr/, not mixed in with file weaves |
79 |
import os |
1267
by Martin Pool
- notes on conversion of existing history to weaves |
80 |
import tempfile |
81 |
import sys |
|
1132
by Martin Pool
- fix up logging for history2weaves tool |
82 |
import logging |
1352
by Martin Pool
- store control weaves in .bzr/, not mixed in with file weaves |
83 |
import shutil |
1132
by Martin Pool
- fix up logging for history2weaves tool |
84 |
|
1355
by Martin Pool
- write working inventory into final location |
85 |
from bzrlib.branch import Branch, find_branch, BZR_BRANCH_FORMAT_5 |
1080
by Martin Pool
- test tool for converting history to weave files |
86 |
from bzrlib.revfile import Revfile |
87 |
from bzrlib.weave import Weave |
|
88 |
from bzrlib.weavefile import read_weave, write_weave |
|
89 |
from bzrlib.progress import ProgressBar |
|
90 |
from bzrlib.atomicfile import AtomicFile |
|
1300
by Martin Pool
- refactor weave upgrade into a MethodObject |
91 |
from bzrlib.xml4 import serializer_v4 |
92 |
from bzrlib.xml5 import serializer_v5 |
|
1307
by Martin Pool
- start walking through ancestors in conversion to weaves |
93 |
from bzrlib.trace import mutter, note, warning, enable_default_logging |
1326
by Martin Pool
- check inventory sha when loading old revisions |
94 |
from bzrlib.osutils import sha_strings, sha_string |
1337
by Martin Pool
- produce ancestry when converting versions |
95 |
from bzrlib.commit import merge_ancestry_lines |
1267
by Martin Pool
- notes on conversion of existing history to weaves |
96 |
|
1080
by Martin Pool
- test tool for converting history to weave files |
97 |
|
1300
by Martin Pool
- refactor weave upgrade into a MethodObject |
98 |
class Convert(object):
    """Method object that upgrades a format-4 branch to weave storage.

    Constructing an instance runs the whole conversion (``__init__`` calls
    ``convert()``).  State is kept on the instance:

    * ``revisions``        -- rev_id -> revision object loaded from the branch
    * ``absent_revisions`` -- rev_ids referenced as parents but not present
    * ``converted_revs``   -- rev_ids whose contents have been converted
    * ``text_weaves``      -- file_id -> in-memory Weave of that file's texts
    * ``text_count``       -- number of texts added to the weaves
    """

    def __init__(self, base_dir):
        """Record `base_dir` and immediately run the conversion on it."""
        self.base = base_dir
        self.converted_revs = set()
        self.absent_revisions = set()
        self.text_count = 0
        self.revisions = {}
        self.convert()

    def convert(self):
        """Run the complete upgrade of the branch at ``self.base``.

        Returns without doing anything if `_open_branch` reports that no
        upgrade is needed.
        """
        if not self._open_branch():
            return
        note('starting upgrade of %s', os.path.abspath(self.base))
        self._backup_control_dir()
        note('starting upgrade')
        note('note: upgrade may be faster if all store files are ungzipped first')
        self.pb = ProgressBar()
        if not os.path.isdir(self.base + '/.bzr/weaves'):
            os.mkdir(self.base + '/.bzr/weaves')
        self.inv_weave = Weave('inventory')
        self.anc_weave = Weave('ancestry')
        self.ancestries = {}
        # holds in-memory weaves for all files
        self.text_weaves = {}
        # The format marker is removed up front and only rewritten by
        # _set_new_format() once everything else has been written.
        os.remove(self.branch.controlfilename('branch-format'))
        self._convert_working_inv()
        rev_history = self.branch.revision_history()
        # to_read is a stack holding the revisions we still need to process;
        # appending to it adds new highest-priority revisions
        self.known_revisions = set(rev_history)
        # Slicing (rather than indexing [-1]) leaves the stack empty for a
        # branch with no revisions instead of raising IndexError.
        self.to_read = rev_history[-1:]
        while self.to_read:
            rev_id = self.to_read.pop()
            if (rev_id not in self.revisions
                    and rev_id not in self.absent_revisions):
                self._load_one_rev(rev_id)
        self.pb.clear()
        to_import = self._make_order()
        for i, rev_id in enumerate(to_import):
            self.pb.update('converting revision', i, len(to_import))
            self._convert_one_rev(rev_id)
        self.pb.clear()
        note('upgraded to weaves:')
        note(' %6d revisions and inventories' % len(self.revisions))
        note(' %6d absent revisions removed' % len(self.absent_revisions))
        note(' %6d texts' % self.text_count)
        self._write_all_weaves()
        self._write_all_revs()
        self._set_new_format()
        self._cleanup_spare_files()

    def _open_branch(self):
        """Open the branch and decide whether it needs upgrading.

        Returns True for a format-4 branch and False for a format-5 branch.
        Raises BzrError for any other format.
        """
        self.branch = Branch.open_downlevel(self.base)
        if self.branch._branch_format == 5:
            note('this branch is already in the most current format')
            return False
        if self.branch._branch_format != 4:
            # BzrError is not among this module's top-level imports, so it
            # is imported here where it is needed.
            from bzrlib.errors import BzrError
            raise BzrError("cannot upgrade from branch format %r" %
                           self.branch._branch_format)
        return True

    def _set_new_format(self):
        """Write the format-5 marker into the 'branch-format' control file."""
        f = self.branch.controlfile('branch-format', 'wb')
        try:
            f.write(BZR_BRANCH_FORMAT_5)
        finally:
            f.close()

    def _cleanup_spare_files(self):
        """Delete control files and stores that are no longer used."""
        for n in 'merged-patches', 'pending-merged-patches':
            p = self.branch.controlfilename(n)
            if not os.path.exists(p):
                continue
            ## assert os.path.getsize(p) == 0
            os.remove(p)
        shutil.rmtree(self.base + '/.bzr/inventory-store')
        shutil.rmtree(self.base + '/.bzr/text-store')

    def _backup_control_dir(self):
        """Copy the '.bzr' directory to '.bzr.backup' before changing it."""
        orig = self.base + '/.bzr'
        backup = orig + '.backup'
        note('making backup of tree history')
        shutil.copytree(orig, backup)
        note('%s has been backed up to %s', orig, backup)
        note('if conversion fails, you can move this directory back to .bzr')
        note('if it succeeds, you can remove this directory if you wish')

    def _convert_working_inv(self):
        """Rewrite the working inventory control file from v4 to v5 XML."""
        branch = self.branch
        # Read fully and close before reopening the same control file for
        # writing, so neither handle is left open.
        inv_in = branch.controlfile('inventory', 'rb')
        try:
            inv = serializer_v4.read_inventory(inv_in)
        finally:
            inv_in.close()
        inv_out = branch.controlfile('inventory', 'wb')
        try:
            serializer_v5.write_inventory(inv, inv_out)
        finally:
            inv_out.close()

    def _write_all_weaves(self):
        """Write the inventory, ancestry and per-file weaves to disk."""
        write_a_weave(self.inv_weave, self.base + '/.bzr/inventory.weave')
        write_a_weave(self.anc_weave, self.base + '/.bzr/ancestry.weave')
        try:
            for i, (file_id, file_weave) in enumerate(self.text_weaves.items()):
                self.pb.update('writing weave', i, len(self.text_weaves))
                write_a_weave(file_weave,
                              self.base + '/.bzr/weaves/%s.weave' % file_id)
        finally:
            self.pb.clear()

    def _write_all_revs(self):
        """Write all revisions out in new form."""
        # The revision store is recreated empty, then one file is written per
        # converted revision.
        shutil.rmtree(self.base + '/.bzr/revision-store')
        os.mkdir(self.base + '/.bzr/revision-store')
        try:
            for i, rev_id in enumerate(self.converted_revs):
                self.pb.update('write revision', i, len(self.converted_revs))
                f = open(self.base + '/.bzr/revision-store/%s' % rev_id, 'wb')
                try:
                    serializer_v5.write_revision(self.revisions[rev_id], f)
                finally:
                    f.close()
        finally:
            self.pb.clear()

    def _load_one_rev(self, rev_id):
        """Load a revision object into memory.

        Any parents not either loaded or abandoned get queued to be
        loaded.  A revision missing from the revision store is recorded in
        ``absent_revisions`` instead.
        """
        self.pb.update('loading revision',
                       len(self.revisions),
                       len(self.known_revisions))
        if rev_id not in self.branch.revision_store:
            self.pb.clear()
            note('revision {%s} not present in branch; '
                 'will not be converted',
                 rev_id)
            self.absent_revisions.add(rev_id)
        else:
            rev_xml = self.branch.revision_store[rev_id].read()
            rev = serializer_v4.read_revision_from_string(rev_xml)
            for parent_id in rev.parent_ids:
                self.known_revisions.add(parent_id)
                # Parents already seen are filtered out by the loop in
                # convert() when they are popped.
                self.to_read.append(parent_id)
            self.revisions[rev_id] = rev

    def _load_old_inventory(self, rev_id):
        """Return the v4 inventory of a not-yet-converted revision.

        When the revision records an inventory sha1 it is compared with the
        stored XML.  The comparison is an ``assert``, so it is skipped when
        Python runs with -O.
        """
        assert rev_id not in self.converted_revs
        old_inv_xml = self.branch.inventory_store[rev_id].read()
        inv = serializer_v4.read_inventory_from_string(old_inv_xml)
        rev = self.revisions[rev_id]
        if rev.inventory_sha1:
            assert rev.inventory_sha1 == sha_string(old_inv_xml), \
                'inventory sha mismatch for {%s}' % rev_id
        return inv

    def _load_updated_inventory(self, rev_id):
        """Return the v5 inventory of an already-converted revision.

        The text is read back from the in-memory inventory weave.
        """
        assert rev_id in self.converted_revs
        inv_xml = self.inv_weave.get_text(rev_id)
        inv = serializer_v5.read_inventory_from_string(inv_xml)
        return inv

    def _convert_one_rev(self, rev_id):
        """Convert revision and all referenced objects to new format."""
        rev = self.revisions[rev_id]
        inv = self._load_old_inventory(rev_id)
        # Iterate over a copy because absent parents are removed in place.
        for parent_id in rev.parent_ids[:]:
            if parent_id in self.absent_revisions:
                rev.parent_ids.remove(parent_id)
                self.pb.clear()
                note('remove {%s} as parent of {%s}', parent_id, rev_id)
        self._convert_revision_contents(rev, inv)
        self._store_new_weave(rev, inv)
        self._make_rev_ancestry(rev)
        self.converted_revs.add(rev_id)

    def _store_new_weave(self, rev, inv):
        """Add the upgraded inventory to the inventory weave.

        Also updates ``rev.inventory_sha1`` to the sha1 of the new XML.
        """
        # the XML is now updated with text versions
        if __debug__:
            for file_id in inv:
                ie = inv[file_id]
                if ie.kind == 'root_directory':
                    continue
                assert hasattr(ie, 'name_version'), \
                    'no name_version on {%s} in {%s}' % \
                    (file_id, rev.revision_id)
                if ie.kind == 'file':
                    assert hasattr(ie, 'text_version')

        new_inv_xml = serializer_v5.write_inventory_to_string(inv)
        new_inv_sha1 = sha_string(new_inv_xml)
        self.inv_weave.add(rev.revision_id, rev.parent_ids,
                           new_inv_xml.splitlines(True),
                           new_inv_sha1)
        rev.inventory_sha1 = new_inv_sha1

    def _make_rev_ancestry(self, rev):
        """Add the ancestry of `rev` to the ancestry weave.

        The ancestry lines are the mash of the parents' ancestries followed
        by the revision's own id.  In debug mode the result is cross-checked
        against `merge_ancestry_lines`.
        """
        rev_id = rev.revision_id
        for parent_id in rev.parent_ids:
            assert parent_id in self.converted_revs
        if rev.parent_ids:
            lines = list(self.anc_weave.mash_iter(rev.parent_ids))
        else:
            lines = []
        lines.append(rev_id + '\n')
        if __debug__:
            parent_ancestries = [self.ancestries[p] for p in rev.parent_ids]
            new_lines = merge_ancestry_lines(rev_id, parent_ancestries)
            assert set(lines) == set(new_lines)
            self.ancestries[rev_id] = new_lines
        self.anc_weave.add(rev_id, rev.parent_ids, lines)

    def _convert_revision_contents(self, rev, inv):
        """Convert all the files within a revision.

        Also upgrade the inventory to refer to the text revision ids.
        """
        rev_id = rev.revision_id
        mutter('converting texts of revision {%s}',
               rev_id)
        # Must be a real list: it is passed to len() and iterated once per
        # file below.
        parent_invs = [self._load_updated_inventory(parent_id)
                       for parent_id in rev.parent_ids]
        for file_id in inv:
            ie = inv[file_id]
            self._set_name_version(rev, ie, parent_invs)
            if ie.kind != 'file':
                continue
            self._convert_file_version(rev, ie, parent_invs)

    def _set_name_version(self, rev, ie, parent_invs):
        """Set name version for a file.

        Done in a slightly lazy way: if the file is renamed or in a merge
        revision it gets a new version, otherwise the same as before.
        The root directory entry is left untouched.
        """
        file_id = ie.file_id
        if ie.kind == 'root_directory':
            return
        if len(parent_invs) != 1:
            ie.name_version = rev.revision_id
        else:
            old_inv = parent_invs[0]
            if not old_inv.has_id(file_id):
                ie.name_version = rev.revision_id
            else:
                old_ie = old_inv[file_id]
                if (old_ie.parent_id != ie.parent_id
                        or old_ie.name != ie.name):
                    ie.name_version = rev.revision_id
                else:
                    ie.name_version = old_ie.name_version

    def _convert_file_version(self, rev, ie, parent_invs):
        """Convert one version of one file.

        The file needs to be added into the weave if it is a merge
        of >=2 parents or if it's changed from its parent.
        """
        file_id = ie.file_id
        rev_id = rev.revision_id
        w = self.text_weaves.get(file_id)
        if w is None:
            w = Weave(file_id)
            self.text_weaves[file_id] = w
        file_parents = []
        text_changed = False
        for parent_inv in parent_invs:
            if parent_inv.has_id(file_id):
                parent_ie = parent_inv[file_id]
                old_text_version = parent_ie.text_version
                assert old_text_version in self.converted_revs
                if old_text_version not in file_parents:
                    file_parents.append(old_text_version)
                if parent_ie.text_sha1 != ie.text_sha1:
                    text_changed = True
        if len(file_parents) != 1 or text_changed:
            file_lines = self.branch.text_store[ie.text_id].readlines()
            assert sha_strings(file_lines) == ie.text_sha1
            assert sum(map(len, file_lines)) == ie.text_size
            w.add(rev_id, file_parents, file_lines, ie.text_sha1)
            ie.text_version = rev_id
            self.text_count += 1
            ##mutter('import text {%s} of {%s}',
            ##       ie.text_id, file_id)
        else:
            ##mutter('text of {%s} unchanged from parent', file_id)
            ie.text_version = file_parents[0]
        # NOTE(review): indentation was lost in the source this was recovered
        # from; text_id is assumed to be dropped on both paths -- confirm.
        del ie.text_id

    def _make_order(self):
        """Return a suitable order for importing revisions.

        The order must be such that a revision is imported after all
        its (present) parents.

        Raises BzrError if a full pass over the remaining revisions makes no
        progress (for example when parents form a cycle), instead of looping
        forever.
        """
        todo = set(self.revisions.keys())
        done = self.absent_revisions.copy()
        o = []
        while todo:
            progressed = False
            # scan through looking for a revision whose parents
            # are all done
            for rev_id in sorted(todo):
                rev = self.revisions[rev_id]
                parent_ids = set(rev.parent_ids)
                if parent_ids.issubset(done):
                    # can take this one now
                    o.append(rev_id)
                    todo.remove(rev_id)
                    done.add(rev_id)
                    progressed = True
            if not progressed:
                from bzrlib.errors import BzrError
                raise BzrError("cannot order revisions for import; "
                               "unresolvable parents for %r" % sorted(todo))
        return o
1377
by Martin Pool
- run conversion to weaves from the 'bzr upgrade' command |
422 |
|
1309
by Martin Pool
- first cut at tsort to make order to bring in revisions |
423 |
|
1332
by Martin Pool
- clean up code that writes out weave results |
424 |
def write_a_weave(weave, filename):
    """Write `weave` to the file named `filename` using `write_weave`.

    The file is opened in binary write mode and is always closed, even if
    writing fails.
    """
    # open() rather than the file() builtin, which exists only in Python 2.
    inv_wf = open(filename, 'wb')
    try:
        write_weave(weave, inv_wf)
    finally:
        inv_wf.close()
|
430 |
||
1377
by Martin Pool
- run conversion to weaves from the 'bzr upgrade' command |
431 |
|
432 |
def upgrade(base_dir):
    """Upgrade the branch at `base_dir`.

    All the work happens in the `Convert` constructor; the instance is
    discarded and nothing is returned.
    """
    Convert(base_dir)