23
25
from cStringIO import StringIO
24
from warnings import warn
30
28
from bzrlib.weavefile import read_weave, write_weave_v5
31
from bzrlib.weave import WeaveFile, Weave
32
from bzrlib.store import TransportStore
29
from bzrlib.weave import Weave
30
from bzrlib.store import TransportStore, hash_prefix
33
31
from bzrlib.atomicfile import AtomicFile
34
from bzrlib.symbol_versioning import (deprecated_method,
32
from bzrlib.errors import NoSuchFile, FileExists
36
33
from bzrlib.trace import mutter
40
class VersionedFileStore(TransportStore):
41
"""Collection of many versioned files in a transport."""
43
# TODO: Rather than passing versionedfile_kwargs, perhaps pass in a
44
# transport factory callable?
45
def __init__(self, transport, prefixed=False, precious=False,
46
dir_mode=None, file_mode=None,
47
versionedfile_class=WeaveFile,
48
versionedfile_kwargs={},
50
super(VersionedFileStore, self).__init__(transport,
51
dir_mode=dir_mode, file_mode=file_mode,
52
prefixed=prefixed, compressed=False, escaped=escaped)
36
class WeaveStore(TransportStore):
37
"""Collection of several weave files in a directory.
39
This has some shortcuts for reading and writing them.
41
FILE_SUFFIX = '.weave'
43
def __init__(self, transport, prefixed=False, precious=False):
44
self._transport = transport
45
self._prefixed = prefixed
53
46
self._precious = precious
54
self._versionedfile_class = versionedfile_class
55
self._versionedfile_kwargs = versionedfile_kwargs
56
# Used for passing get_scope to versioned file constructors;
59
48
def filename(self, file_id):
60
49
"""Return the path relative to the transport root."""
61
return self._relpath(file_id)
51
return hash_prefix(file_id) + urllib.quote(file_id) + WeaveStore.FILE_SUFFIX
53
return urllib.quote(file_id) + WeaveStore.FILE_SUFFIX
63
55
def __iter__(self):
64
suffixes = self._versionedfile_class.get_suffixes()
56
l = len(WeaveStore.FILE_SUFFIX)
66
57
for relpath in self._iter_files_recursive():
67
for suffix in suffixes:
68
if relpath.endswith(suffix):
69
# TODO: use standard remove_suffix function
70
escaped_id = os.path.basename(relpath[:-len(suffix)])
71
file_id = self._mapper.unmap(escaped_id)[0]
72
if file_id not in ids:
75
break # only one suffix can match
77
def has_id(self, file_id):
78
suffixes = self._versionedfile_class.get_suffixes()
79
filename = self.filename(file_id)
80
for suffix in suffixes:
81
if not self._transport.has(filename + suffix):
85
def get_empty(self, file_id, transaction):
86
"""Get an empty weave, which implies deleting the existing one first."""
87
if self.has_id(file_id):
88
self.delete(file_id, transaction)
89
return self.get_weave_or_empty(file_id, transaction)
91
def delete(self, file_id, transaction):
92
"""Remove file_id from the store."""
93
suffixes = self._versionedfile_class.get_suffixes()
94
filename = self.filename(file_id)
95
for suffix in suffixes:
96
self._transport.delete(filename + suffix)
58
if relpath.endswith(WeaveStore.FILE_SUFFIX):
59
yield os.path.basename(relpath[:-l])
61
def has_id(self, fileid):
62
return self._transport.has(self.filename(fileid))
98
64
def _get(self, file_id):
99
65
return self._transport.get(self.filename(file_id))
101
67
def _put(self, file_id, f):
102
fn = self.filename(file_id)
104
return self._transport.put_file(fn, f, mode=self._file_mode)
105
except errors.NoSuchFile:
106
if not self._prefixed:
108
self._transport.mkdir(os.path.dirname(fn), mode=self._dir_mode)
109
return self._transport.put_file(fn, f, mode=self._file_mode)
111
def get_weave(self, file_id, transaction, _filename=None):
112
"""Return the VersionedFile for file_id.
114
:param _filename: filename that would be returned from self.filename for
115
file_id. This is used to reduce duplicate filename calculations when
116
using 'get_weave_or_empty'. FOR INTERNAL USE ONLY.
118
if _filename is None:
119
_filename = self.filename(file_id)
120
if transaction.writeable():
121
w = self._versionedfile_class(_filename, self._transport, self._file_mode,
122
get_scope=self.get_scope, **self._versionedfile_kwargs)
124
w = self._versionedfile_class(_filename,
129
get_scope=self.get_scope,
130
**self._versionedfile_kwargs)
70
self._transport.mkdir(hash_prefix(file_id))
73
return self._transport.put(self.filename(file_id), f)
75
def get_weave(self, file_id, transaction):
76
weave = transaction.map.find_weave(file_id)
78
mutter("cache hit in %s for %s", self, file_id)
80
w = read_weave(self._get(file_id))
81
transaction.map.add_weave(file_id, w)
82
transaction.register_clean(w, precious=self._precious)
133
def _make_new_versionedfile(self, file_id, transaction,
134
known_missing=False, _filename=None):
135
"""Make a new versioned file.
137
:param _filename: filename that would be returned from self.filename for
138
file_id. This is used to reduce duplicate filename calculations when
139
using 'get_weave_or_empty'. FOR INTERNAL USE ONLY.
141
if not known_missing and self.has_id(file_id):
142
self.delete(file_id, transaction)
143
if _filename is None:
144
_filename = self.filename(file_id)
146
# we try without making the directory first because thats optimising
147
# for the common case.
148
weave = self._versionedfile_class(_filename, self._transport, self._file_mode, create=True,
149
get_scope=self.get_scope, **self._versionedfile_kwargs)
150
except errors.NoSuchFile:
151
if not self._prefixed:
152
# unexpected error - NoSuchFile is expected to be raised on a
153
# missing dir only and that only occurs when we are prefixed.
155
dirname = osutils.dirname(_filename)
156
self._transport.mkdir(dirname, mode=self._dir_mode)
157
weave = self._versionedfile_class(_filename, self._transport,
158
self._file_mode, create=True,
159
get_scope=self.get_scope,
160
**self._versionedfile_kwargs)
85
def get_lines(self, file_id, rev_id, transaction):
86
"""Return text from a particular version of a weave.
88
Returned as a list of lines."""
89
w = self.get_weave(file_id, transaction)
90
return w.get(w.lookup(rev_id))
163
92
def get_weave_or_empty(self, file_id, transaction):
164
"""Return a weave, or an empty one if it doesn't exist."""
165
# This is typically used from 'commit' and 'fetch/push/pull' where
166
# we scan across many versioned files once. As such the small overhead
167
# of calculating the filename before doing a cache lookup is more than
168
# compensated for by not calculating the filename when making new
170
_filename = self.filename(file_id)
93
"""Return a weave, or an empty one if it doesn't exist."""
172
return self.get_weave(file_id, transaction, _filename=_filename)
173
except errors.NoSuchFile:
174
weave = self._make_new_versionedfile(file_id, transaction,
175
known_missing=True, _filename=_filename)
95
return self.get_weave(file_id, transaction)
97
weave = Weave(weave_name=file_id)
98
transaction.map.add_weave(file_id, weave)
99
transaction.register_clean(weave, precious=self._precious)
178
def _put_weave(self, file_id, weave, transaction):
179
"""Preserved here for upgrades-to-weaves to use."""
180
myweave = self._make_new_versionedfile(file_id, transaction)
181
myweave.insert_record_stream(weave.get_record_stream(
182
[(version,) for version in weave.versions()],
183
'topological', False))
185
def copy_all_ids(self, store_from, pb=None, from_transaction=None,
186
to_transaction=None):
187
"""Copy all the file ids from store_from into self."""
188
if from_transaction is None:
189
warn("Please pass from_transaction into "
190
"versioned_store.copy_all_ids.", stacklevel=2)
191
if to_transaction is None:
192
warn("Please pass to_transaction into "
193
"versioned_store.copy_all_ids.", stacklevel=2)
194
if not store_from.listable():
195
raise errors.UnlistableStore(store_from)
197
for count, file_id in enumerate(store_from):
199
pb.update('listing files', count, count)
203
mutter('copy_all ids: %r', ids)
204
self.copy_multi(store_from, ids, pb=pb,
205
from_transaction=from_transaction,
206
to_transaction=to_transaction)
208
def copy_multi(self, from_store, file_ids, pb=None, from_transaction=None,
209
to_transaction=None):
210
"""Copy all the versions for multiple file_ids from from_store.
212
:param from_transaction: required current transaction in from_store.
214
from bzrlib.transactions import PassThroughTransaction
215
if from_transaction is None:
216
warn("WeaveStore.copy_multi without a from_transaction parameter "
217
"is deprecated. Please provide a from_transaction.",
220
# we are reading one object - caching is irrelevant.
221
from_transaction = PassThroughTransaction()
222
if to_transaction is None:
223
warn("WeaveStore.copy_multi without a to_transaction parameter "
224
"is deprecated. Please provide a to_transaction.",
227
# we are copying single objects, and there may be open tranasactions
228
# so again with the passthrough
229
to_transaction = PassThroughTransaction()
230
pb = bzrlib.ui.ui_factory.nested_progress_bar()
232
for count, f in enumerate(file_ids):
233
mutter("copy weave {%s} into %s", f, self)
234
pb.update('copy', count, len(file_ids))
235
# if we have it in cache, its faster.
236
# joining is fast with knits, and bearable for weaves -
237
# indeed the new case can be optimised if needed.
238
target = self._make_new_versionedfile(f, to_transaction)
239
source = from_store.get_weave(f, from_transaction)
240
target.insert_record_stream(source.get_record_stream(
241
[(version,) for version in source.versions()],
242
'topological', False))
246
def total_size(self):
247
count, bytes = super(VersionedFileStore, self).total_size()
248
return (count / len(self._versionedfile_class.get_suffixes())), bytes
250
WeaveStore = VersionedFileStore
102
def put_weave(self, file_id, weave, transaction):
103
"""Write back a modified weave"""
104
transaction.register_dirty(weave)
105
# TODO FOR WRITE TRANSACTIONS: this should be done in a callback
106
# from the transaction, when it decides to save.
108
write_weave_v5(weave, sio)
110
self._put(file_id, sio)
112
def add_text(self, file_id, rev_id, new_lines, parents, transaction):
113
w = self.get_weave_or_empty(file_id, transaction)
114
parent_idxs = map(w.lookup, parents)
115
w.add(rev_id, parent_idxs, new_lines)
116
self.put_weave(file_id, w, transaction)
118
def add_identical_text(self, file_id, old_rev_id, new_rev_id, parents,
120
w = self.get_weave_or_empty(file_id, transaction)
121
parent_idxs = map(w.lookup, parents)
122
w.add_identical(old_rev_id, new_rev_id, parent_idxs)
123
self.put_weave(file_id, w, transaction)
125
def copy_multi(self, from_store, file_ids):
126
assert isinstance(from_store, WeaveStore)
128
mutter("copy weave {%s} into %s", f, self)
129
self._put(f, from_store._get(f))