0.1.1
by Martin Pool
Check in old existing knit code. |
1 |
#! /usr/bin/python
|
2 |
||
3 |
# Copyright (C) 2005 Canonical Ltd
|
|
4 |
||
0.1.33
by Martin Pool
add gpl text |
5 |
# This program is free software; you can redistribute it and/or modify
|
6 |
# it under the terms of the GNU General Public License as published by
|
|
7 |
# the Free Software Foundation; either version 2 of the License, or
|
|
8 |
# (at your option) any later version.
|
|
9 |
||
10 |
# This program is distributed in the hope that it will be useful,
|
|
11 |
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
12 |
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
13 |
# GNU General Public License for more details.
|
|
14 |
||
15 |
# You should have received a copy of the GNU General Public License
|
|
16 |
# along with this program; if not, write to the Free Software
|
|
17 |
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
0.1.1
by Martin Pool
Check in old existing knit code. |
18 |
|
19 |
# Author: Martin Pool <mbp@canonical.com>
|
|
20 |
||
21 |
||
0.1.38
by Martin Pool
Rename knit to weave. (I don't think there's an existing module called weave.) |
22 |
"""Weave - storage of related text file versions"""
|
0.1.2
by Martin Pool
Import testsweet module adapted from bzr. |
23 |
|
0.1.61
by Martin Pool
doc |
24 |
# TODO: Perhaps have copy method for Weave instances?
|
0.1.2
by Martin Pool
Import testsweet module adapted from bzr. |
25 |
|
0.1.58
by Martin Pool
doc |
26 |
# XXX: If we do weaves this way, will a merge still behave the same
|
27 |
# way if it's done in a different order? That's a pretty desirable
|
|
28 |
# property.
|
|
29 |
||
0.1.62
by Martin Pool
Lame command-line client for reading and writing weaves. |
30 |
# TODO: How to write these to disk? One option is cPickle, which
|
31 |
# would be fast but less friendly to C, and perhaps not portable. Another is
|
|
32 |
||
33 |
# TODO: Nothing here so far assumes the lines are really \n newlines,
|
|
34 |
# rather than being split up in some other way. We could accommodate
|
|
35 |
# binaries, perhaps by naively splitting on \n or perhaps using
|
|
36 |
# something like a rolling checksum.
|
|
37 |
||
38 |
# TODO: Perhaps track SHA-1 in the header for protection? This would
|
|
39 |
# be redundant with it being stored in the inventory, but perhaps
|
|
40 |
# usefully so?
|
|
41 |
||
42 |
# TODO: Track version names as well as indexes.
|
|
43 |
||
44 |
# TODO: Probably do transitive expansion when specifying parents?
|
|
0.1.58
by Martin Pool
doc |
45 |
|
0.1.68
by Martin Pool
doc |
46 |
# TODO: Separate out some code to read and write weaves.
|
47 |
||
0.1.85
by Martin Pool
doc |
48 |
# TODO: End marker for each version so we can stop reading?
|
0.1.69
by Martin Pool
Simple text-based format for storing weaves, cleaner than |
49 |
|
50 |
# TODO: Check that no insertion occurs inside a deletion that was
|
|
51 |
# active in the version of the insertion.
|
|
52 |
||
0.1.85
by Martin Pool
doc |
53 |
# TODO: Perhaps a special slower check() method that verifies more
|
54 |
# nesting constraints and the MD5 of each version?
|
|
55 |
||
56 |
||
0.1.34
by Martin Pool
remove dead code |
57 |
|
0.1.66
by Martin Pool
Cope without set/frozenset classes |
58 |
# Very old Pythons (2.3) have no builtin ``set``/``frozenset``; on those,
# bind the equivalent classes from the ``sets`` module under the builtin
# names so the rest of the module can use ``set`` and ``frozenset`` freely.
try:
    set, frozenset
except NameError:
    import sets as _sets_compat
    set = _sets_compat.Set
    frozenset = _sets_compat.ImmutableSet
    # don't leave the helper module name lying around in this namespace
    del _sets_compat
0.1.66
by Martin Pool
Cope without set/frozenset classes |
66 |
|
67 |
||
0.1.47
by Martin Pool
New WeaveError and WeaveFormatError rather than assertions. |
68 |
class WeaveError(Exception):
    """Exception in processing weave.

    Base class for the weave-specific errors raised by this module.
    """
|
|
70 |
||
71 |
||
72 |
class WeaveFormatError(WeaveError):
    """Weave invariant violated.

    Raised when the stored weave structure itself is inconsistent, as
    opposed to a problem with the arguments passed by the caller.
    """
|
|
74 |
||
75 |
||
0.1.38
by Martin Pool
Rename knit to weave. (I don't think there's an existing module called weave.) |
76 |
class Weave(object):
    """weave - versioned text file storage.

    A Weave manages versions of line-based text files, keeping track
    of the originating version for each line.

    To clients the "lines" of the file are represented as a list of strings.
    These strings will typically have terminal newline characters, but
    this is not required.  In particular files commonly do not have a newline
    at the end of the file.

    Texts can be identified in either of two ways:

    * a nonnegative index number.

    * a version-id string.

    Typically the index number will be valid only inside this weave and
    the version-id is used to reference it in the larger world.

    The weave is represented as a list mixing edit instructions and
    literal text.  Each entry in _l can be either a string (or
    unicode), or a tuple.  If a string, it means that the given line
    should be output in the currently active revisions.

    If a tuple, it gives a processing instruction saying in which
    revisions the enclosed lines are active.  The tuple has the form
    (instruction, version).

    The instruction can be '{' or '}' for an insertion block, and '['
    and ']' for a deletion block respectively.  The version is the
    integer version index.  There is no replace operator, only deletes
    and inserts.

    Constraints/notes:

    * A later version can delete lines that were introduced by any
      number of ancestor versions; this implies that deletion
      instructions can span insertion blocks without regard to the
      insertion block's nesting.

    * Similarly, deletions need not be properly nested with regard to
      each other, because they might have been generated by
      independent revisions.

    * Insertions are always made by inserting a new bracketed block
      into a single point in the previous weave.  This implies they
      can nest but not overlap, and the nesting must always have later
      insertions on the inside.

    * It doesn't seem very useful to have an active insertion
      inside an inactive insertion, but it might happen.

    * Therefore, all instructions are always "considered"; that
      is passed onto and off the stack.  An outer inactive block
      doesn't disable an inner block.

    * Lines are enabled if the most recent enclosing insertion is
      active and none of the enclosing deletions are active.

    * There is no point having a deletion directly inside its own
      insertion; you might as well just not write it.  And there
      should be no way to get an earlier version deleting a later
      version.

    _l
        Text of the weave.

    _v
        List of versions, indexed by index number.

        For each version we store the set (included_versions), which
        lists the previous versions also considered active; the
        versions included in those versions are included transitively.
        So new versions created from nothing list []; most versions
        have a single entry; some have more.

    _sha1s
        List of hex SHA-1 of each version, or None if not recorded.
    """

    # Types accepted as a line of text in the weave.  ``basestring`` only
    # exists on Python 2; elsewhere fall back to the text and bytes types.
    try:
        _line_types = (basestring,)
    except NameError:
        _line_types = (str, bytes)

    def __init__(self):
        """Create an empty weave with no versions."""
        self._l = []
        self._v = []
        self._sha1s = []


    def __eq__(self, other):
        """Two weaves are equal if their version lists and weave text match.

        The recorded SHA-1s are not part of the comparison.
        """
        if not isinstance(other, Weave):
            return False
        return self._v == other._v \
               and self._l == other._l


    def __ne__(self, other):
        return not self.__eq__(other)


    def _sha1_hexdigest(self, lines):
        """Return the hex SHA-1 of the concatenation of lines."""
        try:
            from hashlib import sha1 as new_sha1
        except ImportError:
            # interpreters that predate hashlib only have the sha module
            from sha import new as new_sha1
        s = new_sha1()
        for l in lines:
            s.update(l)
        return s.hexdigest()


    def add(self, parents, text):
        """Add a single text on top of the weave.

        Returns the index number of the newly added version.

        parents
            List or set of parent version numbers.  This must normally include
            the parents and the parent's parents, or weird things might happen.

        text
            Sequence of lines to be added in the new version."""
        # argument validation is currently switched off:
        ## self._check_versions(parents)
        ## self._check_lines(text)
        idx = len(self._v)

        sha1 = self._sha1_hexdigest(text)

        if parents:
            # _delta is a generator, but it finishes reading the basis out
            # of self._l before yielding its first change, so it is safe to
            # modify self._l while walking the delta.
            delta = self._delta(self.inclusions(parents), text)

            # offset gives the number of lines that have been inserted
            # into the weave up to the current point; if the original edit
            # instruction says to change line A then we actually change
            # (A+offset)
            offset = 0

            for i1, i2, newlines in delta:
                assert 0 <= i1
                assert i1 <= i2
                assert i2 <= len(self._l)

                # the deletion and insertion are handled separately.
                # first delete the region.
                if i1 != i2:
                    self._l.insert(i1+offset, ('[', idx))
                    self._l.insert(i2+offset+1, (']', idx))
                    offset += 2
                    # is this OK???

                if newlines:
                    # there may have been a deletion spanning up to
                    # i2; we want to insert after this region to make sure
                    # we don't destroy ourselves
                    i = i2 + offset
                    self._l[i:i] = [('{', idx)] \
                                   + newlines \
                                   + [('}', idx)]
                    offset += 2 + len(newlines)

            self._addversion(parents)
        else:
            # special case; adding with no parents revision; can do this
            # more quickly by just appending unconditionally
            self._l.append(('{', idx))
            self._l += text
            self._l.append(('}', idx))

            self._addversion(None)

        self._sha1s.append(sha1)

        return idx


    def inclusions(self, versions):
        """Expand out everything included by versions.

        Returns a new set holding the given versions plus everything
        recorded in _v for each of them.  Raises ValueError if a version
        index is beyond the end of the version list.
        """
        i = set(versions)
        for v in versions:
            try:
                i.update(self._v[v])
            except IndexError:
                raise ValueError("version %d not present in weave" % v)
        return i


    def minimal_parents(self, version):
        """Find the minimal set of parents for the version.

        Returns a list, highest version first, from which every included
        version that is itself included by another listed one is dropped.
        """
        included = self._v[version]
        if not included:
            return []

        # walk from the newest included version down, so that anything an
        # already chosen parent includes is seen as covered before we
        # reach it
        li = list(included)
        li.sort()
        li.reverse()

        mininc = []
        gotit = set()

        for pv in li:
            if pv not in gotit:
                mininc.append(pv)
                gotit.update(self._v[pv])

        assert mininc[0] >= 0
        assert mininc[-1] < version
        return mininc


    def _addversion(self, parents):
        """Append the included-version set for a new version to _v."""
        if parents:
            self._v.append(frozenset(parents))
        else:
            self._v.append(frozenset())


    def _check_lines(self, text):
        """Raise ValueError unless text is a list of strings."""
        if not isinstance(text, list):
            raise ValueError("text should be a list, not %s" % type(text))

        for l in text:
            if not isinstance(l, self._line_types):
                raise ValueError("text line should be a string or unicode, not %s"
                                 % type(l))


    def _check_versions(self, indexes):
        """Check everything in the sequence of indexes is valid"""
        for i in indexes:
            try:
                self._v[i]
            except IndexError:
                raise IndexError("invalid version number %r" % i)


    def annotate(self, index):
        """Return annotate_iter(index) as a list."""
        return list(self.annotate_iter(index))


    def annotate_iter(self, version):
        """Yield list of (index-id, line) pairs for the specified version.

        The index indicates when the line originated in the weave."""
        included = self.inclusions([version])
        for origin, lineno, text in self._extract(included):
            yield origin, text


    def _extract(self, included):
        """Yield annotation of lines in included set.

        Yields a sequence of tuples (origin, lineno, text), where
        origin is the origin version, lineno the index in the weave,
        and text the text of the line.

        The set typically but not necessarily corresponds to a version.

        Raises WeaveFormatError if an insertion or deletion block is
        still open at the end of the weave.
        """
        istack = []             # versions of the open insertion blocks
        dset = set()            # included versions with an open deletion

        lineno = 0              # line of weave, 0-based
        isactive = False
        line_types = self._line_types

        for l in self._l:
            if isinstance(l, tuple):
                c, v = l
                if c == '{':
                    # Every insertion block is tracked, even when its
                    # version is not included: the lines inside it belong
                    # to that version and must not be attributed to an
                    # enclosing block that is included.
                    assert v not in istack
                    istack.append(v)
                elif c == '}':
                    oldv = istack.pop()
                    assert oldv == v
                elif c == '[':
                    # deletions only matter if made by an included version
                    if v in included:
                        assert v not in dset
                        dset.add(v)
                else:
                    assert c == ']'
                    if v in included:
                        assert v in dset
                        dset.remove(v)
                # lines are enabled if the innermost enclosing insertion is
                # included and no included deletion is open
                isactive = ((not dset)
                            and bool(istack)
                            and (istack[-1] in included))
            else:
                assert isinstance(l, line_types)
                if isactive:
                    yield istack[-1], lineno, l
            lineno += 1

        if istack:
            raise WeaveFormatError("unclosed insertion blocks at end of weave",
                                   istack)
        if dset:
            raise WeaveFormatError("unclosed deletion blocks at end of weave",
                                   dset)


    def get_iter(self, version):
        """Yield lines for the specified version."""
        for origin, lineno, line in self._extract(self.inclusions([version])):
            yield line


    def get(self, index):
        """Return the lines of the specified version as a list."""
        return list(self.get_iter(index))


    def mash_iter(self, included):
        """Return composed version of multiple included versions."""
        included = frozenset(included)
        for origin, lineno, text in self._extract(included):
            yield text


    def dump(self, to_file):
        """Pretty-print the raw _l and _v structures to to_file."""
        from pprint import pprint
        to_file.write("Weave._l = ")
        pprint(self._l, to_file)
        to_file.write("Weave._v = ")
        pprint(self._v, to_file)


    def numversions(self):
        """Return the number of versions stored in the weave."""
        l = len(self._v)
        assert l == len(self._sha1s)
        return l


    def check(self):
        """Check the consistency of the weave.

        Raises WeaveFormatError if a version includes itself or a later
        version, and WeaveError if the text extracted for a version does
        not match its recorded SHA-1.  Versions with no recorded SHA-1
        (None) are still extracted but not compared.
        """
        # check no circular inclusions
        for version in range(self.numversions()):
            inclusions = list(self._v[version])
            if inclusions:
                inclusions.sort()
                if inclusions[-1] >= version:
                    raise WeaveFormatError("invalid included version %d for index %d"
                                           % (inclusions[-1], version))

        # try extracting all versions; this is a bit slow and parallel
        # extraction could be used
        for version in range(self.numversions()):
            hd = self._sha1_hexdigest(self.get_iter(version))
            expected = self._sha1s[version]
            if expected is not None and hd != expected:
                raise WeaveError("mismatched sha1 for version %d; "
                                 "got %s, expected %s"
                                 % (version, hd, expected))

        # TODO: check insertions are properly nested, that there are
        # no lines outside of insertion blocks, that deletions are
        # properly paired, etc.


    def merge(self, merge_versions):
        """Automerge and mark conflicts between versions.

        This returns a sequence, each entry describing alternatives
        for a chunk of the file.  Each of the alternatives is given as
        a list of lines.

        If there is a chunk of the file where there's no disagreement,
        only one alternative is given.

        Not implemented yet; always raises NotImplementedError.
        """

        # approach: find the included versions common to all the
        # merged versions
        raise NotImplementedError()


    def _delta(self, included, lines):
        """Return changes from basis to new revision.

        The old text for comparison is the union of included revisions.

        This is used in inserting a new text.

        Delta is returned as a sequence of
        (weave1, weave2, newlines).

        This indicates that weave1:weave2 of the old weave should be
        replaced by the sequence of lines in newlines.  Note that
        these line numbers are positions in the total weave and don't
        correspond to the lines in any extracted version, or even the
        extracted union of included versions.

        If weave1=weave2, this is a pure insert; if newlines=[] this is a
        pure delete.  (Similar to difflib.)
        """
        # basis_lines is the text of the basis; basis_lineno[k] is the
        # position in the weave of basis_lines[k]
        basis_lineno = []
        basis_lines = []
        for origin, lineno, line in self._extract(included):
            basis_lineno.append(lineno)
            basis_lines.append(line)

        # add a sentinel, because we can also match against the final line
        basis_lineno.append(len(self._l))

        # XXX: which line of the weave should we really consider
        # matches the end of the file?  the current code says it's the
        # last line of the weave?

        from difflib import SequenceMatcher
        s = SequenceMatcher(None, basis_lines, lines)

        # TODO: Perhaps return line numbers from composed weave as well?

        for tag, i1, i2, j1, j2 in s.get_opcodes():
            if tag == 'equal':
                continue

            # i1,i2 are given in offsets within basis_lines; we need to map
            # them back to offsets within the entire weave
            real_i1 = basis_lineno[i1]
            real_i2 = basis_lineno[i2]

            assert 0 <= j1
            assert j1 <= j2
            assert j2 <= len(lines)

            yield real_i1, real_i2, lines[j1:j2]
0.1.21
by Martin Pool
Start computing a delta to insert a new revision |
501 |
|
0.1.1
by Martin Pool
Check in old existing knit code. |
502 |
|
0.1.62
by Martin Pool
Lame command-line client for reading and writing weaves. |
503 |
|
0.1.88
by Martin Pool
Add weave info command. |
504 |
def weave_info(filename, out):
    """Show some text information about the weave.

    Reads the weave stored in the file called filename and writes a
    summary to out: the file size, the number of versions, one table
    row per version (index, line count, byte count, SHA-1 and minimal
    parents) and the total size of all versions compared with the size
    of the weave file.

    filename
        Name of the weave file to read.

    out
        File-like object with a write() method; all output goes here.
    """
    from weavefile import read_weave

    wf = open(filename, 'rb')
    try:
        w = read_weave(wf)
        # FIXME: doesn't work on pipes
        weave_size = wf.tell()
    finally:
        wf.close()

    write = out.write
    write("weave file size %d bytes\n" % weave_size)
    write("weave contains %d versions\n" % len(w._v))

    total = 0
    write('%6s %6s %8s %40s %20s\n'
          % ('ver', 'lines', 'bytes', 'sha1', 'parents'))
    write(' '.join(['-' * width for width in (6, 6, 8, 40, 20)]) + '\n')
    for i in range(len(w._v)):
        text = w.get(i)
        lines = len(text)
        nbytes = sum([len(a) for a in text])
        sha1 = w._sha1s[i]
        parents = ', '.join(map(str, w.minimal_parents(i)))
        write('%6d %6d %8d %40s %s\n' % (i, lines, nbytes, sha1, parents))
        total += nbytes

    write("versions total %d bytes\n" % total)
    # a zero-length file has no meaningful ratio; skip it rather than
    # fail with a division by zero
    if weave_size:
        write("compression ratio %.3f\n" % (float(total)/float(weave_size)))
|
869
by Martin Pool
- more weave.py command line options |
530 |
|
531 |
||
532 |
def usage():
    """Print the help text for the weave command-line tool to stdout."""
    help_text = """bzr weave tool

Experimental tool for weave algorithm.

usage:
    weave init WEAVEFILE
        Create an empty weave file
    weave get WEAVEFILE VERSION
        Write out specified version.
    weave check WEAVEFILE
        Check consistency of all versions.
    weave info WEAVEFILE
        Display table of contents.
    weave add WEAVEFILE [BASE...] < NEWTEXT
        Add NEWTEXT, with specified parent versions.
    weave annotate WEAVEFILE VERSION
        Display origin of each line.
    weave mash WEAVEFILE VERSION...
        Display composite of all selected versions.
    weave merge WEAVEFILE VERSION1 VERSION2 > OUT
        Auto-merge two versions and display conflicts.

example:

    % weave init foo.weave
    % vi foo.txt
    % weave add foo.weave < foo.txt
    added version 0

    (create updated version)
    % vi foo.txt
    % weave get foo.weave 0 | diff -u - foo.txt
    % weave add foo.weave 0 < foo.txt
    added version 1

    % weave get foo.weave 0 > foo.txt (create forked version)
    % vi foo.txt
    % weave add foo.weave 0 < foo.txt
    added version 2

    % weave merge foo.weave 1 2 > foo.txt (merge them)
    % vi foo.txt (resolve conflicts)
    % weave add foo.weave 1 2 < foo.txt (commit merged version)

"""
    # A single parenthesized argument prints exactly like the bare
    # print statement does.
    print(help_text)
|
0.1.88
by Martin Pool
Add weave info command. |
578 |
|
579 |
||
0.1.62
by Martin Pool
Lame command-line client for reading and writing weaves. |
580 |
|
581 |
def main(argv):
    """Run the weave command-line tool.

    argv -- full argument vector: argv[0] is the program name, argv[1]
        the command, argv[2] the weave file, and any remaining items are
        arguments of the command (see usage()).

    Returns 1 after printing the usage text when no command is given or
    when 'merge' gets the wrong number of arguments; otherwise returns
    None.  Raises ValueError for an unknown command and IOError when
    'init' is pointed at a file that already exists.
    """
    import sys
    import os

    # A bare invocation used to fail with IndexError on argv[1].
    if len(argv) < 2:
        usage()
        return 1
    cmd = argv[1]

    def readit():
        # Load the weave named on the command line and close the file.
        # NOTE(review): assumes read_weave() consumes the file completely
        # before returning -- confirm against weavefile.
        from weavefile import read_weave
        f = open(argv[2], 'rb')
        try:
            return read_weave(f)
        finally:
            f.close()

    def writeit(w, path):
        # Store weave `w` at `path`, closing the file so the data is
        # flushed before anything is reported to the user.
        from weavefile import write_weave
        f = open(path, 'wb')
        try:
            write_weave(w, f)
        finally:
            f.close()

    if cmd == 'help':
        usage()
    elif cmd == 'add':
        w = readit()
        # parents are the version numbers given after the weave file
        parents = [int(arg) for arg in argv[3:]]
        lines = sys.stdin.readlines()
        ver = w.add(parents, lines)
        writeit(w, argv[2])
        print('added version %d' % ver)
    elif cmd == 'init':
        fn = argv[2]
        if os.path.exists(fn):
            raise IOError("file exists")
        w = Weave()
        writeit(w, fn)
    elif cmd == 'get':  # get one version
        w = readit()
        sys.stdout.writelines(w.get_iter(int(argv[3])))

    elif cmd == 'mash':  # get composite
        w = readit()
        sys.stdout.writelines(w.mash_iter([int(arg) for arg in argv[3:]]))

    elif cmd == 'annotate':
        w = readit()
        # newline is added to all lines regardless; too hard to get
        # reasonable formatting otherwise
        lasto = None
        for origin, text in w.annotate(int(argv[3])):
            text = text.rstrip('\r\n')
            if origin == lasto:
                # Same origin as the previous line: leave the number
                # column blank but keep the bars aligned.
                print('%5s | %s' % ('', text))
            else:
                print('%5d | %s' % (origin, text))
                lasto = origin

    elif cmd == 'info':
        weave_info(argv[2], sys.stdout)

    elif cmd == 'check':
        w = readit()
        w.check()

    elif cmd == 'merge':
        if len(argv) != 5:
            usage()
            return 1

        w = readit()
        v1, v2 = map(int, argv[3:5])

        # Merge base: the composite of the versions included in both sides.
        basis = w.inclusions([v1]).intersection(w.inclusions([v2]))

        base_lines = list(w.mash_iter(basis))
        a_lines = list(w.get(v1))
        b_lines = list(w.get(v2))

        from bzrlib.merge3 import Merge3
        m3 = Merge3(base_lines, a_lines, b_lines)

        name_a = 'version %d' % v1
        name_b = 'version %d' % v2
        sys.stdout.writelines(m3.merge_lines(name_a=name_a, name_b=name_b))
    else:
        raise ValueError('unknown command %r' % cmd)
|
656 |
||
657 |
||
658 |
# Script entry point: run main() on the process arguments and use its
# return value as the exit status.
if __name__ == '__main__':
    import sys
    raise SystemExit(main(sys.argv))