199
262
def _count_log_matches(self, target, logs):
    """Count how often the target file pattern was fetched in an http log.

    :param target: Path fragment expected at the end of the requested URL.
        It is matched literally.
    :param logs: Iterable of http server log lines.
    :return: The number of lines that record a GET of ``target`` answered
        with status 200 or 206 for a client identifying as this bzr version.
    """
    # Escape the interpolated values so that a '.' in a path or in the
    # version number cannot match an arbitrary character.
    get_succeeds_re = re.compile(
        '.*"GET .*%s HTTP/1.1" 20[06] - "-" "bzr/%s' %
        (re.escape(target), re.escape(bzrlib.__version__)))
    count = 0
    for line in logs:
        if get_succeeds_re.match(line):
            count += 1
    return count
211
273
def test_weaves_are_retrieved_once(self):
212
274
self.build_tree(("source/", "source/file", "target/"))
213
wt = self.make_branch_and_tree('source')
275
# This test depends on knit data storage.
276
wt = self.make_branch_and_tree('source', format='dirstate-tags')
214
277
branch = wt.branch
215
278
wt.add(["file"], ["id"])
216
279
wt.commit("added file")
217
print >>open("source/file", 'w'), "blah"
280
open("source/file", 'w').write("blah\n")
218
281
wt.commit("changed file")
219
282
target = BzrDir.create_branch_and_repo("target/")
220
283
source = Branch.open(self.get_readonly_url("source/"))
221
self.assertEqual(target.fetch(source), (2, []))
222
log_pattern = '%%s HTTP/1.1" 200 - "-" "bzr/%s' % bzrlib.__version__
223
# this is the path to the literal file. As format changes
285
# this is the path to the literal file. As format changes
224
286
# occur it needs to be updated. FIXME: ask the store for the
226
288
self.log("web server logs are:")
227
289
http_logs = self.get_readonly_server().logs
228
290
self.log('\n'.join(http_logs))
229
# unfortunately this log entry is branch format specific. We could
230
# factor out the 'what files does this format use' to a method on the
291
# unfortunately this log entry is branch format specific. We could
292
# factor out the 'what files does this format use' to a method on the
231
293
# repository, which would let us do this generically. RBC 20060419
294
# RBC 20080408: Or perhaps we can assert that no files are fully read
232
296
self.assertEqual(1, self._count_log_matches('/ce/id.kndx', http_logs))
233
297
self.assertEqual(1, self._count_log_matches('/ce/id.knit', http_logs))
234
298
self.assertEqual(1, self._count_log_matches('inventory.kndx', http_logs))
235
# this r-h check test will prevent regressions, but it currently already
299
# this r-h check test will prevent regressions, but it currently already
236
300
# passes, before the patch to cache-rh is applied :[
237
self.assertEqual(1, self._count_log_matches('revision-history', http_logs))
301
self.assertTrue(1 >= self._count_log_matches('revision-history',
303
self.assertTrue(1 >= self._count_log_matches('last-revision',
238
305
# FIXME naughty poking in there.
239
306
self.get_readonly_server().logs = []
240
# check there is nothing more to fetch
241
source = Branch.open(self.get_readonly_url("source/"))
242
self.assertEqual(target.fetch(source), (0, []))
307
# check there is nothing more to fetch. We take care to re-use the
308
# existing transport so that the request logs we're about to examine
309
# aren't cluttered with redundant probes for a smart server.
310
# XXX: Perhaps this further parameterisation: test http with smart
311
# server, and test http without smart server?
312
source = Branch.open(
313
self.get_readonly_url("source/"),
314
possible_transports=[source.bzrdir.root_transport])
243
316
# should make just two requests
244
317
http_logs = self.get_readonly_server().logs
245
318
self.log("web server logs are:")
246
319
self.log('\n'.join(http_logs))
247
320
self.assertEqual(1, self._count_log_matches('branch-format', http_logs))
248
321
self.assertEqual(1, self._count_log_matches('branch/format', http_logs))
249
self.assertEqual(1, self._count_log_matches('repository/format', http_logs))
250
self.assertEqual(1, self._count_log_matches('revision-history', http_logs))
251
self.assertEqual(4, len(http_logs))
322
self.assertEqual(1, self._count_log_matches('repository/format',
324
self.assertEqual(1, self._count_log_matches('revisions.kndx',
326
self.assertTrue(1 >= self._count_log_matches('revision-history',
328
self.assertTrue(1 >= self._count_log_matches('last-revision',
330
self.assertLength(5, http_logs)
333
class TestKnitToPackFetch(TestCaseWithTransport):
335
def find_get_record_stream(self, calls, expected_count=1):
    """In a list of calls, find the last 'get_record_stream'.

    :param calls: Sequence of recorded calls; the first item of each call
        is compared against the method name 'get_record_stream'.
    :param expected_count: The number of calls we should expect to find.
        If a different number is found, an assertion is raised.
    :return: The last 'get_record_stream' call, or None if there was none.
    """
    get_record_call = None
    call_count = 0
    for call in calls:
        if call[0] == 'get_record_stream':
            call_count += 1
            # Keep overwriting so that the last matching call wins.
            get_record_call = call
    self.assertEqual(expected_count, call_count)
    return get_record_call
350
def test_fetch_with_deltas_no_delta_closure(self):
351
tree = self.make_branch_and_tree('source', format='dirstate')
352
target = self.make_repository('target', format='pack-0.92')
353
self.build_tree(['source/file'])
354
tree.set_root_id('root-id')
355
tree.add('file', 'file-id')
356
tree.commit('one', rev_id='rev-one')
357
source = tree.branch.repository
358
source.texts = versionedfile.RecordingVersionedFilesDecorator(
360
source.signatures = versionedfile.RecordingVersionedFilesDecorator(
362
source.revisions = versionedfile.RecordingVersionedFilesDecorator(
364
source.inventories = versionedfile.RecordingVersionedFilesDecorator(
367
self.assertTrue(target._format._fetch_uses_deltas)
368
target.fetch(source, revision_id='rev-one')
369
self.assertEqual(('get_record_stream', [('file-id', 'rev-one')],
370
target._format._fetch_order, False),
371
self.find_get_record_stream(source.texts.calls))
372
self.assertEqual(('get_record_stream', [('rev-one',)],
373
target._format._fetch_order, False),
374
self.find_get_record_stream(source.inventories.calls, 2))
375
self.assertEqual(('get_record_stream', [('rev-one',)],
376
target._format._fetch_order, False),
377
self.find_get_record_stream(source.revisions.calls))
378
# XXX: Signatures is special, and slightly broken. The
379
# standard item_keys_introduced_by actually does a lookup for every
380
# signature to see if it exists, rather than waiting to do them all at
381
# once at the end. The fetch code then does an all-at-once and just
382
# allows for some of them to be missing.
383
# So we know there will be extra calls, but the *last* one is the one
385
signature_calls = source.signatures.calls[-1:]
386
self.assertEqual(('get_record_stream', [('rev-one',)],
387
target._format._fetch_order, False),
388
self.find_get_record_stream(signature_calls))
390
def test_fetch_no_deltas_with_delta_closure(self):
391
tree = self.make_branch_and_tree('source', format='dirstate')
392
target = self.make_repository('target', format='pack-0.92')
393
self.build_tree(['source/file'])
394
tree.set_root_id('root-id')
395
tree.add('file', 'file-id')
396
tree.commit('one', rev_id='rev-one')
397
source = tree.branch.repository
398
source.texts = versionedfile.RecordingVersionedFilesDecorator(
400
source.signatures = versionedfile.RecordingVersionedFilesDecorator(
402
source.revisions = versionedfile.RecordingVersionedFilesDecorator(
404
source.inventories = versionedfile.RecordingVersionedFilesDecorator(
406
# XXX: This won't work in general, but for the dirstate format it does.
407
old_fetch_uses_deltas_setting = target._format._fetch_uses_deltas
409
target._format._fetch_uses_deltas = old_fetch_uses_deltas_setting
410
self.addCleanup(restore)
411
target._format._fetch_uses_deltas = False
412
target.fetch(source, revision_id='rev-one')
413
self.assertEqual(('get_record_stream', [('file-id', 'rev-one')],
414
target._format._fetch_order, True),
415
self.find_get_record_stream(source.texts.calls))
416
self.assertEqual(('get_record_stream', [('rev-one',)],
417
target._format._fetch_order, True),
418
self.find_get_record_stream(source.inventories.calls, 2))
419
self.assertEqual(('get_record_stream', [('rev-one',)],
420
target._format._fetch_order, True),
421
self.find_get_record_stream(source.revisions.calls))
422
# XXX: Signatures is special, and slightly broken. The
423
# standard item_keys_introduced_by actually does a lookup for every
424
# signature to see if it exists, rather than waiting to do them all at
425
# once at the end. The fetch code then does an all-at-once and just
426
# allows for some of them to be missing.
427
# So we know there will be extra calls, but the *last* one is the one
429
signature_calls = source.signatures.calls[-1:]
430
self.assertEqual(('get_record_stream', [('rev-one',)],
431
target._format._fetch_order, True),
432
self.find_get_record_stream(signature_calls))
434
def test_fetch_revisions_with_deltas_into_pack(self):
    """A revision stored as a delta is a fulltext after fetching to a pack."""
    # See BUG #261339, dev versions of bzr could accidentally create deltas
    # in revision texts in knit branches (when fetching from packs). So we
    # ensure that *if* a knit repository has a delta in revisions, that it
    # gets properly expanded back into a fulltext when stored in the pack.
    tree = self.make_branch_and_tree('source', format='dirstate')
    target = self.make_repository('target', format='pack-0.92')
    self.build_tree(['source/file'])
    tree.set_root_id('root-id')
    tree.add('file', 'file-id')
    tree.commit('one', rev_id='rev-one')
    # Hack the KVF for revisions so that it "accidentally" allows a delta
    tree.branch.repository.revisions._max_delta_chain = 200
    tree.commit('two', rev_id='rev-two')
    source = tree.branch.repository
    # Ensure that we stored a delta
    # Take the lock that the cleanup below releases.
    source.lock_read()
    self.addCleanup(source.unlock)
    record = source.revisions.get_record_stream([('rev-two',)],
        'unordered', False).next()
    self.assertEqual('knit-delta-gz', record.storage_kind)
    target.fetch(tree.branch.repository, revision_id='rev-two')
    # The record should get expanded back to a fulltext
    # Take the lock that the cleanup below releases.
    target.lock_read()
    self.addCleanup(target.unlock)
    record = target.revisions.get_record_stream([('rev-two',)],
        'unordered', False).next()
    self.assertEqual('knit-ft-gz', record.storage_kind)
464
def test_fetch_with_fallback_and_merge(self):
465
builder = self.make_branch_builder('source', format='pack-0.92')
466
builder.start_series()
477
# A & B are present in the base (stacked-on) repository, A-E are
478
# present in the source.
479
# This reproduces bug #304841
480
# We need a large enough inventory that total size of compressed deltas
481
# is shorter than the size of a compressed fulltext. We have to use
482
# random ids because otherwise the inventory fulltext compresses too
483
# well and the deltas get bigger.
485
('add', ('', 'TREE_ROOT', 'directory', None))]
487
fname = 'file%03d' % (i,)
488
fileid = '%s-%s' % (fname, osutils.rand_chars(64))
489
to_add.append(('add', (fname, fileid, 'file', 'content\n')))
490
builder.build_snapshot('A', None, to_add)
491
builder.build_snapshot('B', ['A'], [])
492
builder.build_snapshot('C', ['A'], [])
493
builder.build_snapshot('D', ['C'], [])
494
builder.build_snapshot('E', ['D'], [])
495
builder.build_snapshot('F', ['E', 'B'], [])
496
builder.finish_series()
497
source_branch = builder.get_branch()
498
source_branch.bzrdir.sprout('base', revision_id='B')
499
target_branch = self.make_branch('target', format='1.6')
500
target_branch.set_stacked_on_url('../base')
501
source = source_branch.repository
503
self.addCleanup(source.unlock)
504
source.inventories = versionedfile.OrderingVersionedFilesDecorator(
506
key_priority={('E',): 1, ('D',): 2, ('C',): 4,
508
# Ensure that the content is yielded in the proper order, and given as
510
records = [(record.key, record.storage_kind)
511
for record in source.inventories.get_record_stream(
512
[('D',), ('C',), ('E',), ('F',)], 'unordered', False)]
513
self.assertEqual([(('E',), 'knit-delta-gz'), (('D',), 'knit-delta-gz'),
514
(('F',), 'knit-delta-gz'), (('C',), 'knit-delta-gz')],
517
target_branch.lock_write()
518
self.addCleanup(target_branch.unlock)
519
target = target_branch.repository
520
target.fetch(source, revision_id='F')
521
# 'C' should be expanded to a fulltext, but D and E should still be
523
stream = target.inventories.get_record_stream(
524
[('C',), ('D',), ('E',), ('F',)],
526
kinds = dict((record.key, record.storage_kind) for record in stream)
527
self.assertEqual({('C',): 'knit-ft-gz', ('D',): 'knit-delta-gz',
528
('E',): 'knit-delta-gz', ('F',): 'knit-delta-gz'},
532
class Test1To2Fetch(TestCaseWithTransport):
533
"""Tests for Model1To2 failure modes"""
535
def make_tree_and_repo(self):
    """Create the tree and repository fixtures used by these tests.

    Sets ``self.tree`` to a 'pack-0.92' branch-and-tree at 'tree' and
    ``self.repo`` to a 'rich-root-pack' repository at 'rich-repo'. The
    repository is write-locked here and unlocked again on cleanup.
    """
    self.tree = self.make_branch_and_tree('tree', format='pack-0.92')
    repo = self.make_repository('rich-repo', format='rich-root-pack')
    self.repo = repo
    repo.lock_write()
    self.addCleanup(repo.unlock)
541
def do_fetch_order_test(self, first, second):
    """Test that fetch works no matter what the set order of revision is.

    This test depends on the order of items in a set, which is
    implementation-dependent, so we test A, B and then B, A.

    :param first: Revision id used for the first commit.
    :param second: Revision id used for the second commit; this is the
        revision that is fetched into self.repo.
    """
    self.make_tree_and_repo()
    self.tree.commit('Commit 1', rev_id=first)
    self.tree.commit('Commit 2', rev_id=second)
    self.repo.fetch(self.tree.branch.repository, second)
552
def test_fetch_order_AB(self):
    """Run do_fetch_order_test committing 'A' first and then 'B'."""
    first, second = 'A', 'B'
    self.do_fetch_order_test(first, second)
556
def test_fetch_order_BA(self):
    """Run do_fetch_order_test committing 'B' first and then 'A'."""
    first, second = 'B', 'A'
    self.do_fetch_order_test(first, second)
560
def get_parents(self, file_id, revision_id):
    """Return the parents recorded in self.repo for one text key.

    :param file_id: File id part of the text key.
    :param revision_id: Revision id part of the text key.
    :return: The entry for ``(file_id, revision_id)`` in the parent map
        returned by ``self.repo.texts.get_parent_map``.
    :raises KeyError: If the parent map has no entry for the key.
    """
    self.repo.lock_read()
    try:
        parent_map = self.repo.texts.get_parent_map([(file_id, revision_id)])
        return parent_map[(file_id, revision_id)]
    finally:
        # Release the read lock even when the lookup fails.
        self.repo.unlock()
568
def test_fetch_ghosts(self):
    """Fetching a revision with a ghost parent records only real parents.

    'second-id' is committed with parents 'left-parent', 'ghost-parent'
    (never committed anywhere) and 'not-ghost-parent'. After fetching it
    into self.repo, the root text's parents are expected to be the
    'left-parent' and 'not-ghost-parent' entries only.
    """
    self.make_tree_and_repo()
    self.tree.commit('first commit', rev_id='left-parent')
    self.tree.add_parent_tree_id('ghost-parent')
    fork = self.tree.bzrdir.sprout('fork', 'null:').open_workingtree()
    fork.commit('not a ghost', rev_id='not-ghost-parent')
    # Bring the fork's revision into the tree's repository before it is
    # added as a parent below.
    self.tree.branch.repository.fetch(fork.branch.repository,
                                      'not-ghost-parent')
    self.tree.add_parent_tree_id('not-ghost-parent')
    self.tree.commit('second commit', rev_id='second-id')
    self.repo.fetch(self.tree.branch.repository, 'second-id')
    root_id = self.tree.get_root_id()
    self.assertEqual(
        ((root_id, 'left-parent'), (root_id, 'not-ghost-parent')),
        self.get_parents(root_id, 'second-id'))
584
def make_two_commits(self, change_root, fetch_twice):
    """Commit 'first-id' and 'second-id', then fetch them into self.repo.

    :param change_root: If true, set the tree's root id to 'unique-id'
        between the two commits.
    :param fetch_twice: If true, fetch 'first-id' on its own before
        fetching 'second-id'; otherwise only 'second-id' is fetched.
    """
    self.make_tree_and_repo()
    self.tree.commit('first commit', rev_id='first-id')
    if change_root:
        self.tree.set_root_id('unique-id')
    self.tree.commit('second commit', rev_id='second-id')
    if fetch_twice:
        self.repo.fetch(self.tree.branch.repository, 'first-id')
    self.repo.fetch(self.tree.branch.repository, 'second-id')
594
def test_fetch_changed_root(self):
    """After one fetch, ('unique-id', 'second-id') must have no parents."""
    self.make_two_commits(change_root=True, fetch_twice=False)
    parents = self.get_parents('unique-id', 'second-id')
    self.assertEqual((), parents)
598
def test_two_fetch_changed_root(self):
    """After two fetches, ('unique-id', 'second-id') must have no parents."""
    self.make_two_commits(change_root=True, fetch_twice=True)
    parents = self.get_parents('unique-id', 'second-id')
    self.assertEqual((), parents)
602
def test_two_fetches(self):
    """With an unchanged root, two fetches keep 'first-id' as its parent."""
    self.make_two_commits(change_root=False, fetch_twice=True)
    expected_parents = (('TREE_ROOT', 'first-id'),)
    parents = self.get_parents('TREE_ROOT', 'second-id')
    self.assertEqual(expected_parents, parents)