~bzr-pqm/bzr/bzr.dev

2592.1.4 by Robert Collins
Create a GraphIndexBuilder.
1
# Copyright (C) 2007 Canonical Ltd
2
#
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
#
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
#
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
17
"""Tests for indices."""
18
2592.1.5 by Robert Collins
Trivial index reading.
19
from bzrlib import errors
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
20
from bzrlib.index import *
2592.1.4 by Robert Collins
Create a GraphIndexBuilder.
21
from bzrlib.tests import TestCaseWithMemoryTransport
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
22
from bzrlib.transport import get_transport
2592.1.4 by Robert Collins
Create a GraphIndexBuilder.
23
24
25
class TestGraphIndexBuilder(TestCaseWithMemoryTransport):
26
27
    def test_build_index_empty(self):
28
        builder = GraphIndexBuilder()
29
        stream = builder.finish()
30
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
31
        self.assertEqual(
32
            "Bazaar Graph Index 1\nnode_ref_lists=0\nkey_elements=1\nlen=0\n\n",
33
            contents)
2592.1.6 by Robert Collins
Record the number of node reference lists a particular index has.
34
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
35
    def test_build_index_empty_two_element_keys(self):
36
        builder = GraphIndexBuilder(key_elements=2)
37
        stream = builder.finish()
38
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
39
        self.assertEqual(
40
            "Bazaar Graph Index 1\nnode_ref_lists=0\nkey_elements=2\nlen=0\n\n",
41
            contents)
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
42
2592.1.6 by Robert Collins
Record the number of node reference lists a particular index has.
43
    def test_build_index_one_reference_list_empty(self):
44
        builder = GraphIndexBuilder(reference_lists=1)
45
        stream = builder.finish()
46
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
47
        self.assertEqual(
48
            "Bazaar Graph Index 1\nnode_ref_lists=1\nkey_elements=1\nlen=0\n\n",
49
            contents)
2592.1.4 by Robert Collins
Create a GraphIndexBuilder.
50
2592.1.10 by Robert Collins
Make validate detect node reference parsing errors.
51
    def test_build_index_two_reference_list_empty(self):
52
        builder = GraphIndexBuilder(reference_lists=2)
53
        stream = builder.finish()
54
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
55
        self.assertEqual(
56
            "Bazaar Graph Index 1\nnode_ref_lists=2\nkey_elements=1\nlen=0\n\n",
57
            contents)
2592.1.10 by Robert Collins
Make validate detect node reference parsing errors.
58
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
59
    def test_build_index_one_node_no_refs(self):
60
        builder = GraphIndexBuilder()
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
61
        builder.add_node(('akey', ), 'data')
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
62
        stream = builder.finish()
63
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
64
        self.assertEqual(
65
            "Bazaar Graph Index 1\nnode_ref_lists=0\nkey_elements=1\nlen=1\n"
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
66
            "akey\x00\x00\x00data\n\n", contents)
67
68
    def test_build_index_one_node_no_refs_accepts_empty_reflist(self):
69
        builder = GraphIndexBuilder()
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
70
        builder.add_node(('akey', ), 'data', ())
2592.1.12 by Robert Collins
Handle basic node adds.
71
        stream = builder.finish()
72
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
73
        self.assertEqual(
74
            "Bazaar Graph Index 1\nnode_ref_lists=0\nkey_elements=1\nlen=1\n"
2592.1.43 by Robert Collins
Various index tweaks and test clarity from John's review.
75
            "akey\x00\x00\x00data\n\n", contents)
2592.1.12 by Robert Collins
Handle basic node adds.
76
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
77
    def test_build_index_one_node_2_element_keys(self):
2624.2.11 by Robert Collins
Review comments.
78
        # multipart keys are separated by \x00 - because they are fixed length,
79
        # not variable this does not cause any issues, and seems clearer to the
80
        # author.
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
81
        builder = GraphIndexBuilder(key_elements=2)
82
        builder.add_node(('akey', 'secondpart'), 'data')
83
        stream = builder.finish()
84
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
85
        self.assertEqual(
86
            "Bazaar Graph Index 1\nnode_ref_lists=0\nkey_elements=2\nlen=1\n"
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
87
            "akey\x00secondpart\x00\x00\x00data\n\n", contents)
88
2592.1.21 by Robert Collins
Empty values are ok.
89
    def test_add_node_empty_value(self):
90
        builder = GraphIndexBuilder()
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
91
        builder.add_node(('akey', ), '')
2592.1.21 by Robert Collins
Empty values are ok.
92
        stream = builder.finish()
93
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
94
        self.assertEqual(
95
            "Bazaar Graph Index 1\nnode_ref_lists=0\nkey_elements=1\nlen=1\n"
2592.1.43 by Robert Collins
Various index tweaks and test clarity from John's review.
96
            "akey\x00\x00\x00\n\n", contents)
2592.1.21 by Robert Collins
Empty values are ok.
97
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
98
    def test_build_index_nodes_sorted(self):
2592.1.17 by Robert Collins
Multi node sort order is defined.
99
        # the highest sorted node comes first.
100
        builder = GraphIndexBuilder()
101
        # use three to have a good chance of glitching dictionary hash
102
        # lookups etc. Insert in randomish order that is not correct
103
        # and not the reverse of the correct order.
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
104
        builder.add_node(('2002', ), 'data')
105
        builder.add_node(('2000', ), 'data')
106
        builder.add_node(('2001', ), 'data')
2592.1.17 by Robert Collins
Multi node sort order is defined.
107
        stream = builder.finish()
108
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
109
        self.assertEqual(
110
            "Bazaar Graph Index 1\nnode_ref_lists=0\nkey_elements=1\nlen=3\n"
2592.1.43 by Robert Collins
Various index tweaks and test clarity from John's review.
111
            "2000\x00\x00\x00data\n"
112
            "2001\x00\x00\x00data\n"
113
            "2002\x00\x00\x00data\n"
2592.1.17 by Robert Collins
Multi node sort order is defined.
114
            "\n", contents)
115
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
116
    def test_build_index_2_element_key_nodes_sorted(self):
117
        # multiple element keys are sorted first-key, second-key.
118
        builder = GraphIndexBuilder(key_elements=2)
119
        # use three values of each key element, to have a good chance of
120
        # glitching dictionary hash lookups etc. Insert in randomish order that
121
        # is not correct and not the reverse of the correct order.
122
        builder.add_node(('2002', '2002'), 'data')
123
        builder.add_node(('2002', '2000'), 'data')
124
        builder.add_node(('2002', '2001'), 'data')
125
        builder.add_node(('2000', '2002'), 'data')
126
        builder.add_node(('2000', '2000'), 'data')
127
        builder.add_node(('2000', '2001'), 'data')
128
        builder.add_node(('2001', '2002'), 'data')
129
        builder.add_node(('2001', '2000'), 'data')
130
        builder.add_node(('2001', '2001'), 'data')
131
        stream = builder.finish()
132
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
133
        self.assertEqual(
134
            "Bazaar Graph Index 1\nnode_ref_lists=0\nkey_elements=2\nlen=9\n"
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
135
            "2000\x002000\x00\x00\x00data\n"
136
            "2000\x002001\x00\x00\x00data\n"
137
            "2000\x002002\x00\x00\x00data\n"
138
            "2001\x002000\x00\x00\x00data\n"
139
            "2001\x002001\x00\x00\x00data\n"
140
            "2001\x002002\x00\x00\x00data\n"
141
            "2002\x002000\x00\x00\x00data\n"
142
            "2002\x002001\x00\x00\x00data\n"
143
            "2002\x002002\x00\x00\x00data\n"
144
            "\n", contents)
145
2592.1.19 by Robert Collins
Node references are tab separated.
146
    def test_build_index_reference_lists_are_included_one(self):
147
        builder = GraphIndexBuilder(reference_lists=1)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
148
        builder.add_node(('key', ), 'data', ([], ))
2592.1.19 by Robert Collins
Node references are tab separated.
149
        stream = builder.finish()
150
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
151
        self.assertEqual(
152
            "Bazaar Graph Index 1\nnode_ref_lists=1\nkey_elements=1\nlen=1\n"
2592.1.43 by Robert Collins
Various index tweaks and test clarity from John's review.
153
            "key\x00\x00\x00data\n"
2592.1.19 by Robert Collins
Node references are tab separated.
154
            "\n", contents)
155
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
156
    def test_build_index_reference_lists_with_2_element_keys(self):
157
        builder = GraphIndexBuilder(reference_lists=1, key_elements=2)
158
        builder.add_node(('key', 'key2'), 'data', ([], ))
159
        stream = builder.finish()
160
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
161
        self.assertEqual(
162
            "Bazaar Graph Index 1\nnode_ref_lists=1\nkey_elements=2\nlen=1\n"
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
163
            "key\x00key2\x00\x00\x00data\n"
164
            "\n", contents)
165
2592.1.19 by Robert Collins
Node references are tab separated.
166
    def test_build_index_reference_lists_are_included_two(self):
167
        builder = GraphIndexBuilder(reference_lists=2)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
168
        builder.add_node(('key', ), 'data', ([], []))
2592.1.19 by Robert Collins
Node references are tab separated.
169
        stream = builder.finish()
170
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
171
        self.assertEqual(
172
            "Bazaar Graph Index 1\nnode_ref_lists=2\nkey_elements=1\nlen=1\n"
2592.1.43 by Robert Collins
Various index tweaks and test clarity from John's review.
173
            "key\x00\x00\t\x00data\n"
2592.1.19 by Robert Collins
Node references are tab separated.
174
            "\n", contents)
175
2592.1.22 by Robert Collins
Node references are byte offsets.
176
    def test_node_references_are_byte_offsets(self):
177
        builder = GraphIndexBuilder(reference_lists=1)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
178
        builder.add_node(('reference', ), 'data', ([], ))
179
        builder.add_node(('key', ), 'data', ([('reference', )], ))
2592.1.22 by Robert Collins
Node references are byte offsets.
180
        stream = builder.finish()
181
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
182
        self.assertEqual(
183
            "Bazaar Graph Index 1\nnode_ref_lists=1\nkey_elements=1\nlen=2\n"
184
            "key\x00\x0072\x00data\n"
2592.1.40 by Robert Collins
Reverse index ordering - we do not have date prefixed revids.
185
            "reference\x00\x00\x00data\n"
2592.1.22 by Robert Collins
Node references are byte offsets.
186
            "\n", contents)
187
2592.1.23 by Robert Collins
node reference delimiting tested.
188
    def test_node_references_are_cr_delimited(self):
189
        builder = GraphIndexBuilder(reference_lists=1)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
190
        builder.add_node(('reference', ), 'data', ([], ))
191
        builder.add_node(('reference2', ), 'data', ([], ))
192
        builder.add_node(('key', ), 'data', ([('reference', ), ('reference2', )], ))
2592.1.23 by Robert Collins
node reference delimiting tested.
193
        stream = builder.finish()
194
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
195
        self.assertEqual(
196
            "Bazaar Graph Index 1\nnode_ref_lists=1\nkey_elements=1\nlen=3\n"
197
            "key\x00\x00077\r094\x00data\n"
2592.1.43 by Robert Collins
Various index tweaks and test clarity from John's review.
198
            "reference\x00\x00\x00data\n"
199
            "reference2\x00\x00\x00data\n"
2592.1.23 by Robert Collins
node reference delimiting tested.
200
            "\n", contents)
201
2592.1.24 by Robert Collins
Delimiting of multiple reference lists is by \t
202
    def test_multiple_reference_lists_are_tab_delimited(self):
203
        builder = GraphIndexBuilder(reference_lists=2)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
204
        builder.add_node(('keference', ), 'data', ([], []))
205
        builder.add_node(('rey', ), 'data', ([('keference', )], [('keference', )]))
2592.1.24 by Robert Collins
Delimiting of multiple reference lists is by \t
206
        stream = builder.finish()
207
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
208
        self.assertEqual(
209
            "Bazaar Graph Index 1\nnode_ref_lists=2\nkey_elements=1\nlen=2\n"
2592.1.43 by Robert Collins
Various index tweaks and test clarity from John's review.
210
            "keference\x00\x00\t\x00data\n"
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
211
            "rey\x00\x0059\t59\x00data\n"
2592.1.24 by Robert Collins
Delimiting of multiple reference lists is by \t
212
            "\n", contents)
213
2592.1.25 by Robert Collins
Fix and tune node offset calculation.
214
    def test_add_node_referencing_missing_key_makes_absent(self):
215
        builder = GraphIndexBuilder(reference_lists=1)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
216
        builder.add_node(('rey', ), 'data', ([('beference', ), ('aeference2', )], ))
2592.1.25 by Robert Collins
Fix and tune node offset calculation.
217
        stream = builder.finish()
218
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
219
        self.assertEqual(
220
            "Bazaar Graph Index 1\nnode_ref_lists=1\nkey_elements=1\nlen=1\n"
2592.1.43 by Robert Collins
Various index tweaks and test clarity from John's review.
221
            "aeference2\x00a\x00\x00\n"
222
            "beference\x00a\x00\x00\n"
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
223
            "rey\x00\x00074\r059\x00data\n"
2592.1.25 by Robert Collins
Fix and tune node offset calculation.
224
            "\n", contents)
225
2592.1.26 by Robert Collins
Test digit buffering is accurate.
226
    def test_node_references_three_digits(self):
227
        # test the node digit expands as needed.
228
        builder = GraphIndexBuilder(reference_lists=1)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
229
        references = [(str(val), ) for val in reversed(range(9))]
230
        builder.add_node(('2-key', ), '', (references, ))
2592.1.26 by Robert Collins
Test digit buffering is accurate.
231
        stream = builder.finish()
232
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
233
        self.assertEqual(
234
            "Bazaar Graph Index 1\nnode_ref_lists=1\nkey_elements=1\nlen=1\n"
2592.1.40 by Robert Collins
Reverse index ordering - we do not have date prefixed revids.
235
            "0\x00a\x00\x00\n"
236
            "1\x00a\x00\x00\n"
237
            "2\x00a\x00\x00\n"
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
238
            "2-key\x00\x00151\r145\r139\r133\r127\r121\r071\r065\r059\x00\n"
2592.1.40 by Robert Collins
Reverse index ordering - we do not have date prefixed revids.
239
            "3\x00a\x00\x00\n"
240
            "4\x00a\x00\x00\n"
241
            "5\x00a\x00\x00\n"
242
            "6\x00a\x00\x00\n"
243
            "7\x00a\x00\x00\n"
2592.1.26 by Robert Collins
Test digit buffering is accurate.
244
            "8\x00a\x00\x00\n"
2592.1.40 by Robert Collins
Reverse index ordering - we do not have date prefixed revids.
245
            "\n", contents)
246
247
    def test_absent_has_no_reference_overhead(self):
248
        # the offsets after an absent record should be correct when there are
249
        # >1 reference lists.
250
        builder = GraphIndexBuilder(reference_lists=2)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
251
        builder.add_node(('parent', ), '', ([('aail', ), ('zther', )], []))
2592.1.40 by Robert Collins
Reverse index ordering - we do not have date prefixed revids.
252
        stream = builder.finish()
253
        contents = stream.read()
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
254
        self.assertEqual(
255
            "Bazaar Graph Index 1\nnode_ref_lists=2\nkey_elements=1\nlen=1\n"
2592.1.40 by Robert Collins
Reverse index ordering - we do not have date prefixed revids.
256
            "aail\x00a\x00\x00\n"
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
257
            "parent\x00\x0059\r84\t\x00\n"
2592.1.40 by Robert Collins
Reverse index ordering - we do not have date prefixed revids.
258
            "zther\x00a\x00\x00\n"
2592.1.26 by Robert Collins
Test digit buffering is accurate.
259
            "\n", contents)
260
2592.1.13 by Robert Collins
Handle mismatched numbers of reference lists.
261
    def test_add_node_bad_key(self):
2592.1.12 by Robert Collins
Handle basic node adds.
262
        builder = GraphIndexBuilder()
2592.1.14 by Robert Collins
Detect bad reference key values.
263
        for bad_char in '\t\n\x0b\x0c\r\x00 ':
264
            self.assertRaises(errors.BadIndexKey, builder.add_node,
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
265
                ('a%skey' % bad_char, ), 'data')
266
        self.assertRaises(errors.BadIndexKey, builder.add_node,
267
                ('', ), 'data')
268
        self.assertRaises(errors.BadIndexKey, builder.add_node,
269
                'not-a-tuple', 'data')
270
        # not enough length
271
        self.assertRaises(errors.BadIndexKey, builder.add_node,
272
                (), 'data')
273
        # too long
274
        self.assertRaises(errors.BadIndexKey, builder.add_node,
275
                ('primary', 'secondary'), 'data')
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
276
        # secondary key elements get checked too:
277
        builder = GraphIndexBuilder(key_elements=2)
278
        for bad_char in '\t\n\x0b\x0c\r\x00 ':
279
            self.assertRaises(errors.BadIndexKey, builder.add_node,
280
                ('prefix', 'a%skey' % bad_char), 'data')
2592.1.12 by Robert Collins
Handle basic node adds.
281
2592.1.13 by Robert Collins
Handle mismatched numbers of reference lists.
282
    def test_add_node_bad_data(self):
2592.1.12 by Robert Collins
Handle basic node adds.
283
        builder = GraphIndexBuilder()
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
284
        self.assertRaises(errors.BadIndexValue, builder.add_node, ('akey', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
285
            'data\naa')
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
286
        self.assertRaises(errors.BadIndexValue, builder.add_node, ('akey', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
287
            'data\x00aa')
2592.1.12 by Robert Collins
Handle basic node adds.
288
2592.1.13 by Robert Collins
Handle mismatched numbers of reference lists.
289
    def test_add_node_bad_mismatched_ref_lists_length(self):
290
        builder = GraphIndexBuilder()
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
291
        self.assertRaises(errors.BadIndexValue, builder.add_node, ('akey', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
292
            'data aa', ([], ))
2592.1.13 by Robert Collins
Handle mismatched numbers of reference lists.
293
        builder = GraphIndexBuilder(reference_lists=1)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
294
        self.assertRaises(errors.BadIndexValue, builder.add_node, ('akey', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
295
            'data aa')
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
296
        self.assertRaises(errors.BadIndexValue, builder.add_node, ('akey', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
297
            'data aa', (), )
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
298
        self.assertRaises(errors.BadIndexValue, builder.add_node, ('akey', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
299
            'data aa', ([], []))
2592.1.13 by Robert Collins
Handle mismatched numbers of reference lists.
300
        builder = GraphIndexBuilder(reference_lists=2)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
301
        self.assertRaises(errors.BadIndexValue, builder.add_node, ('akey', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
302
            'data aa')
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
303
        self.assertRaises(errors.BadIndexValue, builder.add_node, ('akey', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
304
            'data aa', ([], ))
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
305
        self.assertRaises(errors.BadIndexValue, builder.add_node, ('akey', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
306
            'data aa', ([], [], []))
2592.1.13 by Robert Collins
Handle mismatched numbers of reference lists.
307
2592.1.14 by Robert Collins
Detect bad reference key values.
308
    def test_add_node_bad_key_in_reference_lists(self):
309
        # first list, first key - trivial
310
        builder = GraphIndexBuilder(reference_lists=1)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
311
        self.assertRaises(errors.BadIndexKey, builder.add_node, ('akey', ),
312
            'data aa', ([('a key', )], ))
313
        # references keys must be tuples too
314
        self.assertRaises(errors.BadIndexKey, builder.add_node, ('akey', ),
315
            'data aa', (['not-a-tuple'], ))
316
        # not enough length
317
        self.assertRaises(errors.BadIndexKey, builder.add_node, ('akey', ),
318
            'data aa', ([()], ))
319
        # too long
320
        self.assertRaises(errors.BadIndexKey, builder.add_node, ('akey', ),
321
            'data aa', ([('primary', 'secondary')], ))
2592.1.14 by Robert Collins
Detect bad reference key values.
322
        # need to check more than the first key in the list
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
323
        self.assertRaises(errors.BadIndexKey, builder.add_node, ('akey', ),
324
            'data aa', ([('agoodkey', ), ('that is a bad key', )], ))
2592.1.14 by Robert Collins
Detect bad reference key values.
325
        # and if there is more than one list it should be getting checked
326
        # too
327
        builder = GraphIndexBuilder(reference_lists=2)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
328
        self.assertRaises(errors.BadIndexKey, builder.add_node, ('akey', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
329
            'data aa', ([], ['a bad key']))
2592.1.14 by Robert Collins
Detect bad reference key values.
330
2592.1.15 by Robert Collins
Detect duplicate key insertion.
331
    def test_add_duplicate_key(self):
332
        builder = GraphIndexBuilder()
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
333
        builder.add_node(('key', ), 'data')
334
        self.assertRaises(errors.BadIndexDuplicateKey, builder.add_node, ('key', ),
2592.1.46 by Robert Collins
Make GraphIndex accept nodes as key, value, references, so that the method
335
            'data')
2592.1.15 by Robert Collins
Detect duplicate key insertion.
336
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
337
    def test_add_duplicate_key_2_elements(self):
338
        builder = GraphIndexBuilder(key_elements=2)
339
        builder.add_node(('key', 'key'), 'data')
340
        self.assertRaises(errors.BadIndexDuplicateKey, builder.add_node,
341
            ('key', 'key'), 'data')
342
2592.1.16 by Robert Collins
Can add keys after referencing them.
343
    def test_add_key_after_referencing_key(self):
344
        builder = GraphIndexBuilder(reference_lists=1)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
345
        builder.add_node(('key', ), 'data', ([('reference', )], ))
346
        builder.add_node(('reference', ), 'data', ([],))
2592.1.16 by Robert Collins
Can add keys after referencing them.
347
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
348
    def test_add_key_after_referencing_key_2_elements(self):
349
        builder = GraphIndexBuilder(reference_lists=1, key_elements=2)
350
        builder.add_node(('k', 'ey'), 'data', ([('reference', 'tokey')], ))
351
        builder.add_node(('reference', 'tokey'), 'data', ([],))
352
3777.5.3 by John Arbash Meinel
Add Builder.set_optimize(for_size=True) for GraphIndexBuilder and BTreeBuilder.
353
    def test_set_optimize(self):
354
        builder = GraphIndexBuilder(reference_lists=1, key_elements=2)
355
        builder.set_optimize(for_size=True)
356
        self.assertTrue(builder._optimize_for_size)
357
        builder.set_optimize(for_size=False)
358
        self.assertFalse(builder._optimize_for_size)
359
2592.1.5 by Robert Collins
Trivial index reading.
360
361
class TestGraphIndex(TestCaseWithMemoryTransport):
362
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
363
    def make_key(self, number):
364
        return (str(number) + 'X'*100,)
365
366
    def make_value(self, number):
367
            return str(number) + 'Y'*100
368
369
    def make_nodes(self, count=64):
370
        # generate a big enough index that we only read some of it on a typical
371
        # bisection lookup.
372
        nodes = []
373
        for counter in range(count):
374
            nodes.append((self.make_key(counter), self.make_value(counter), ()))
375
        return nodes
376
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
377
    def make_index(self, ref_lists=0, key_elements=1, nodes=[]):
378
        builder = GraphIndexBuilder(ref_lists, key_elements=key_elements)
2624.2.17 by Robert Collins
Review feedback.
379
        for key, value, references in nodes:
380
            builder.add_node(key, value, references)
2592.1.5 by Robert Collins
Trivial index reading.
381
        stream = builder.finish()
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
382
        trans = get_transport('trace+' + self.get_url())
2890.2.1 by Robert Collins
* ``bzrlib.index.GraphIndex`` now requires a size parameter to the
383
        size = trans.put_file('index', stream)
384
        return GraphIndex(trans, 'index', size)
2592.1.5 by Robert Collins
Trivial index reading.
385
2592.1.7 by Robert Collins
A validate that goes boom.
386
    def test_open_bad_index_no_error(self):
387
        trans = self.get_transport()
388
        trans.put_bytes('name', "not an index\n")
2890.2.1 by Robert Collins
* ``bzrlib.index.GraphIndex`` now requires a size parameter to the
389
        index = GraphIndex(trans, 'name', 13)
2592.1.7 by Robert Collins
A validate that goes boom.
390
2890.2.2 by Robert Collins
Opening an index creates a map for the parsed bytes.
391
    def test_open_sets_parsed_map_empty(self):
392
        index = self.make_index()
393
        self.assertEqual([], index._parsed_byte_map)
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
394
        self.assertEqual([], index._parsed_key_map)
395
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
396
    def test_key_count_buffers(self):
397
        index = self.make_index(nodes=self.make_nodes(2))
398
        # reset the transport log
399
        del index._transport._activity[:]
400
        self.assertEqual(2, index.key_count())
401
        # We should have requested reading the header bytes
402
        self.assertEqual([
403
            ('readv', 'index', [(0, 200)], True, index._size),
404
            ],
405
            index._transport._activity)
406
        # And that should have been enough to trigger reading the whole index
407
        # with buffering
408
        self.assertIsNot(None, index._nodes)
409
410
    def test_lookup_key_via_location_buffers(self):
411
        index = self.make_index()
412
        # reset the transport log
413
        del index._transport._activity[:]
414
        # do a _lookup_keys_via_location call for the middle of the file, which
415
        # is what bisection uses.
416
        result = index._lookup_keys_via_location(
417
            [(index._size // 2, ('missing', ))])
418
        # this should have asked for a readv request, with adjust_for_latency,
419
        # and two regions: the header, and half-way into the file.
420
        self.assertEqual([
421
            ('readv', 'index', [(30, 30), (0, 200)], True, 60),
422
            ],
423
            index._transport._activity)
424
        # and the result should be that the key cannot be present, because this
425
        # is a trivial index.
426
        self.assertEqual([((index._size // 2, ('missing', )), False)],
427
            result)
428
        # And this should have caused the file to be fully buffered
429
        self.assertIsNot(None, index._nodes)
430
        self.assertEqual([], index._parsed_byte_map)
431
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
432
    def test_first_lookup_key_via_location(self):
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
433
        # We need enough data so that the _HEADER_READV doesn't consume the
434
        # whole file. We always read 800 bytes for every key, and the local
435
        # transport natural expansion is 4096 bytes. So we have to have >8192
436
        # bytes or we will trigger "buffer_all".
437
        # We also want the 'missing' key to fall within the range that *did*
438
        # read
439
        nodes = []
440
        index = self.make_index(nodes=self.make_nodes(64))
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
441
        # reset the transport log
442
        del index._transport._activity[:]
2890.2.18 by Robert Collins
Review feedback.
443
        # do a _lookup_keys_via_location call for the middle of the file, which
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
444
        # is what bisection uses.
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
445
        start_lookup = index._size // 2
2890.2.18 by Robert Collins
Review feedback.
446
        result = index._lookup_keys_via_location(
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
447
            [(start_lookup, ('40missing', ))])
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
448
        # this should have asked for a readv request, with adjust_for_latency,
449
        # and two regions: the header, and half-way into the file.
450
        self.assertEqual([
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
451
            ('readv', 'index',
452
             [(start_lookup, 800), (0, 200)], True, index._size),
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
453
            ],
454
            index._transport._activity)
455
        # and the result should be that the key cannot be present, because this
456
        # is a trivial index.
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
457
        self.assertEqual([((start_lookup, ('40missing', )), False)],
458
            result)
459
        # And this should not have caused the file to be fully buffered
460
        self.assertIs(None, index._nodes)
461
        # And the regions of the file that have been parsed should be in the
462
        # parsed_byte_map and the parsed_key_map
463
        self.assertEqual([(0, 4008), (5046, 8996)], index._parsed_byte_map)
464
        self.assertEqual([(None, self.make_key(26)),
465
                          (self.make_key(31), self.make_key(48))],
466
                         index._parsed_key_map)
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
467
468
    def test_parsing_non_adjacent_data_trims(self):
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
469
        index = self.make_index(nodes=self.make_nodes(64))
2890.2.18 by Robert Collins
Review feedback.
470
        result = index._lookup_keys_via_location(
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
471
            [(index._size // 2, ('40', ))])
472
        # and the result should be that the key cannot be present, because key is
473
        # in the middle of the observed data from a 4K read - the smallest transport
474
        # will do today with this api.
475
        self.assertEqual([((index._size // 2, ('40', )), False)],
476
            result)
477
        # and we should have a parse map that includes the header and the
478
        # region that was parsed after trimming.
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
479
        self.assertEqual([(0, 4008), (5046, 8996)], index._parsed_byte_map)
480
        self.assertEqual([(None, self.make_key(26)),
481
                          (self.make_key(31), self.make_key(48))],
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
482
            index._parsed_key_map)
483
2890.2.14 by Robert Collins
Parse more than one segment of data from a single readv response if needed.
484
    def test_parsing_data_handles_parsed_contained_regions(self):
485
        # the following patten creates a parsed region that is wholly within a
486
        # single result from the readv layer:
487
        # .... single-read (readv-minimum-size) ...
488
        # which then trims the start and end so the parsed size is < readv
489
        # miniumum.
490
        # then a dual lookup (or a reference lookup for that matter) which
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
491
        # abuts or overlaps the parsed region on both sides will need to
2890.2.14 by Robert Collins
Parse more than one segment of data from a single readv response if needed.
492
        # discard the data in the middle, but parse the end as well.
493
        #
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
494
        # we test this by doing a single lookup to seed the data, then
495
        # a lookup for two keys that are present, and adjacent -
2890.2.14 by Robert Collins
Parse more than one segment of data from a single readv response if needed.
496
        # we except both to be found, and the parsed byte map to include the
497
        # locations of both keys.
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
498
        index = self.make_index(nodes=self.make_nodes(128))
2890.2.18 by Robert Collins
Review feedback.
499
        result = index._lookup_keys_via_location(
2890.2.14 by Robert Collins
Parse more than one segment of data from a single readv response if needed.
500
            [(index._size // 2, ('40', ))])
501
        # and we should have a parse map that includes the header and the
502
        # region that was parsed after trimming.
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
503
        self.assertEqual([(0, 4045), (11759, 15707)], index._parsed_byte_map)
504
        self.assertEqual([(None, self.make_key(116)),
505
                          (self.make_key(35), self.make_key(51))],
2890.2.14 by Robert Collins
Parse more than one segment of data from a single readv response if needed.
506
            index._parsed_key_map)
507
        # now ask for two keys, right before and after the parsed region
2890.2.18 by Robert Collins
Review feedback.
508
        result = index._lookup_keys_via_location(
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
509
            [(11450, self.make_key(34)), (15707, self.make_key(52))])
2890.2.14 by Robert Collins
Parse more than one segment of data from a single readv response if needed.
510
        self.assertEqual([
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
511
            ((11450, self.make_key(34)),
512
             (index, self.make_key(34), self.make_value(34))),
513
            ((15707, self.make_key(52)),
514
             (index, self.make_key(52), self.make_value(52))),
2890.2.14 by Robert Collins
Parse more than one segment of data from a single readv response if needed.
515
            ],
516
            result)
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
517
        self.assertEqual([(0, 4045), (9889, 17993)], index._parsed_byte_map)
2890.2.14 by Robert Collins
Parse more than one segment of data from a single readv response if needed.
518
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
519
    def test_lookup_missing_key_answers_without_io_when_map_permits(self):
520
        # generate a big enough index that we only read some of it on a typical
521
        # bisection lookup.
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
522
        index = self.make_index(nodes=self.make_nodes(64))
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
523
        # lookup the keys in the middle of the file
2890.2.18 by Robert Collins
Review feedback.
524
        result =index._lookup_keys_via_location(
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
525
            [(index._size // 2, ('40', ))])
526
        # check the parse map, this determines the test validity
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
527
        self.assertEqual([(0, 4008), (5046, 8996)], index._parsed_byte_map)
528
        self.assertEqual([(None, self.make_key(26)),
529
                          (self.make_key(31), self.make_key(48))],
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
530
            index._parsed_key_map)
531
        # reset the transport log
532
        del index._transport._activity[:]
533
        # now looking up a key in the portion of the file already parsed should
534
        # not create a new transport request, and should return False (cannot
535
        # be in the index) - even when the byte location we ask for is outside
536
        # the parsed region
2890.2.18 by Robert Collins
Review feedback.
537
        result = index._lookup_keys_via_location(
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
538
            [(4000, ('40', ))])
539
        self.assertEqual([((4000, ('40', )), False)],
540
            result)
541
        self.assertEqual([], index._transport._activity)
542
543
    def test_lookup_present_key_answers_without_io_when_map_permits(self):
544
        # generate a big enough index that we only read some of it on a typical
545
        # bisection lookup.
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
546
        index = self.make_index(nodes=self.make_nodes(64))
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
547
        # lookup the keys in the middle of the file
2890.2.18 by Robert Collins
Review feedback.
548
        result =index._lookup_keys_via_location(
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
549
            [(index._size // 2, ('40', ))])
550
        # check the parse map, this determines the test validity
551
        self.assertEqual([(0, 4008), (5046, 8996)], index._parsed_byte_map)
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
552
        self.assertEqual([(None, self.make_key(26)),
553
                          (self.make_key(31), self.make_key(48))],
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
554
            index._parsed_key_map)
555
        # reset the transport log
556
        del index._transport._activity[:]
557
        # now looking up a key in the portion of the file already parsed should
558
        # not create a new transport request, and should return False (cannot
559
        # be in the index) - even when the byte location we ask for is outside
560
        # the parsed region
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
561
        #
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
562
        result = index._lookup_keys_via_location([(4000, self.make_key(40))])
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
563
        self.assertEqual(
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
564
            [((4000, self.make_key(40)),
565
              (index, self.make_key(40), self.make_value(40)))],
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
566
            result)
567
        self.assertEqual([], index._transport._activity)
568
569
    def test_lookup_key_below_probed_area(self):
570
        # generate a big enough index that we only read some of it on a typical
571
        # bisection lookup.
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
572
        index = self.make_index(nodes=self.make_nodes(64))
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
573
        # ask for the key in the middle, but a key that is located in the
574
        # unparsed region before the middle.
2890.2.18 by Robert Collins
Review feedback.
575
        result =index._lookup_keys_via_location(
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
576
            [(index._size // 2, ('30', ))])
577
        # check the parse map, this determines the test validity
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
578
        self.assertEqual([(0, 4008), (5046, 8996)], index._parsed_byte_map)
579
        self.assertEqual([(None, self.make_key(26)),
580
                          (self.make_key(31), self.make_key(48))],
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
581
            index._parsed_key_map)
582
        self.assertEqual([((index._size // 2, ('30', )), -1)],
583
            result)
584
585
    def test_lookup_key_above_probed_area(self):
586
        # generate a big enough index that we only read some of it on a typical
587
        # bisection lookup.
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
588
        index = self.make_index(nodes=self.make_nodes(64))
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
589
        # ask for the key in the middle, but a key that is located in the
590
        # unparsed region after the middle.
2890.2.18 by Robert Collins
Review feedback.
591
        result =index._lookup_keys_via_location(
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
592
            [(index._size // 2, ('50', ))])
593
        # check the parse map, this determines the test validity
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
594
        self.assertEqual([(0, 4008), (5046, 8996)], index._parsed_byte_map)
595
        self.assertEqual([(None, self.make_key(26)),
596
                          (self.make_key(31), self.make_key(48))],
2890.2.5 by Robert Collins
Create a content lookup function for bisection in GraphIndex.
597
            index._parsed_key_map)
598
        self.assertEqual([((index._size // 2, ('50', )), +1)],
599
            result)
2890.2.2 by Robert Collins
Opening an index creates a map for the parsed bytes.
600
2890.2.6 by Robert Collins
Add support for key references to the index lookup_keys_via_location bisection interface.
601
    def test_lookup_key_resolves_references(self):
602
        # generate a big enough index that we only read some of it on a typical
603
        # bisection lookup.
604
        nodes = []
3665.3.5 by John Arbash Meinel
Move the point at which we 'buffer_all' if we've read >50% of the index.
605
        for counter in range(99):
606
            nodes.append((self.make_key(counter), self.make_value(counter),
607
                ((self.make_key(counter + 20),),)  ))
608
        index = self.make_index(ref_lists=1, nodes=nodes)
609
        # lookup a key in the middle that does not exist, so that when we can
610
        # check that the referred-to-keys are not accessed automatically.
611
        index_size = index._size
612
        index_center = index_size // 2
613
        result = index._lookup_keys_via_location(
614
            [(index_center, ('40', ))])
615
        # check the parse map - only the start and middle should have been
616
        # parsed.
617
        self.assertEqual([(0, 4027), (10198, 14028)], index._parsed_byte_map)
618
        self.assertEqual([(None, self.make_key(17)),
619
                          (self.make_key(44), self.make_key(5))],
620
            index._parsed_key_map)
621
        # and check the transport activity likewise.
622
        self.assertEqual(
623
            [('readv', 'index', [(index_center, 800), (0, 200)], True,
624
                                  index_size)],
625
            index._transport._activity)
626
        # reset the transport log for testing the reference lookup
627
        del index._transport._activity[:]
628
        # now looking up a key in the portion of the file already parsed should
629
        # only perform IO to resolve its key references.
630
        result = index._lookup_keys_via_location([(11000, self.make_key(45))])
631
        self.assertEqual(
632
            [((11000, self.make_key(45)),
633
              (index, self.make_key(45), self.make_value(45),
634
               ((self.make_key(65),),)))],
635
            result)
636
        self.assertEqual([('readv', 'index', [(15093, 800)], True, index_size)],
637
            index._transport._activity)
638
639
    def test_lookup_key_can_buffer_all(self):
640
        nodes = []
2890.2.6 by Robert Collins
Add support for key references to the index lookup_keys_via_location bisection interface.
641
        for counter in range(64):
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
642
            nodes.append((self.make_key(counter), self.make_value(counter),
643
                ((self.make_key(counter + 20),),)  ))
2890.2.6 by Robert Collins
Add support for key references to the index lookup_keys_via_location bisection interface.
644
        index = self.make_index(ref_lists=1, nodes=nodes)
645
        # lookup a key in the middle that does not exist, so that when we can
646
        # check that the referred-to-keys are not accessed automatically.
3665.3.5 by John Arbash Meinel
Move the point at which we 'buffer_all' if we've read >50% of the index.
647
        index_size = index._size
648
        index_center = index_size // 2
649
        result = index._lookup_keys_via_location([(index_center, ('40', ))])
2890.2.6 by Robert Collins
Add support for key references to the index lookup_keys_via_location bisection interface.
650
        # check the parse map - only the start and middle should have been
651
        # parsed.
652
        self.assertEqual([(0, 3890), (6444, 10274)], index._parsed_byte_map)
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
653
        self.assertEqual([(None, self.make_key(25)),
654
                          (self.make_key(37), self.make_key(52))],
2890.2.6 by Robert Collins
Add support for key references to the index lookup_keys_via_location bisection interface.
655
            index._parsed_key_map)
656
        # and check the transport activity likewise.
657
        self.assertEqual(
3665.3.5 by John Arbash Meinel
Move the point at which we 'buffer_all' if we've read >50% of the index.
658
            [('readv', 'index', [(index_center, 800), (0, 200)], True,
659
                                  index_size)],
2890.2.6 by Robert Collins
Add support for key references to the index lookup_keys_via_location bisection interface.
660
            index._transport._activity)
661
        # reset the transport log for testing the reference lookup
662
        del index._transport._activity[:]
663
        # now looking up a key in the portion of the file already parsed should
664
        # only perform IO to resolve its key references.
3665.3.5 by John Arbash Meinel
Move the point at which we 'buffer_all' if we've read >50% of the index.
665
        result = index._lookup_keys_via_location([(7000, self.make_key(40))])
2890.2.6 by Robert Collins
Add support for key references to the index lookup_keys_via_location bisection interface.
666
        self.assertEqual(
3665.3.5 by John Arbash Meinel
Move the point at which we 'buffer_all' if we've read >50% of the index.
667
            [((7000, self.make_key(40)),
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
668
              (index, self.make_key(40), self.make_value(40),
669
               ((self.make_key(60),),)))],
2890.2.6 by Robert Collins
Add support for key references to the index lookup_keys_via_location bisection interface.
670
            result)
3665.3.5 by John Arbash Meinel
Move the point at which we 'buffer_all' if we've read >50% of the index.
671
        # Resolving the references would have required more data read, and we
672
        # are already above the 50% threshold, so it triggered a _buffer_all
673
        self.assertEqual([('get', 'index')], index._transport._activity)
2890.2.6 by Robert Collins
Add support for key references to the index lookup_keys_via_location bisection interface.
674
2592.1.5 by Robert Collins
Trivial index reading.
675
    def test_iter_all_entries_empty(self):
676
        index = self.make_index()
677
        self.assertEqual([], list(index.iter_all_entries()))
678
2592.1.27 by Robert Collins
Test missing end lines with non-empty indices.
679
    def test_iter_all_entries_simple(self):
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
680
        index = self.make_index(nodes=[(('name', ), 'data', ())])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
681
        self.assertEqual([(index, ('name', ), 'data')],
2592.1.27 by Robert Collins
Test missing end lines with non-empty indices.
682
            list(index.iter_all_entries()))
683
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
684
    def test_iter_all_entries_simple_2_elements(self):
685
        index = self.make_index(key_elements=2,
686
            nodes=[(('name', 'surname'), 'data', ())])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
687
        self.assertEqual([(index, ('name', 'surname'), 'data')],
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
688
            list(index.iter_all_entries()))
689
2592.1.28 by Robert Collins
Basic two pass iter_all_entries.
690
    def test_iter_all_entries_references_resolved(self):
691
        index = self.make_index(1, nodes=[
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
692
            (('name', ), 'data', ([('ref', )], )),
693
            (('ref', ), 'refdata', ([], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
694
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),),)),
695
            (index, ('ref', ), 'refdata', ((), ))]),
2592.1.28 by Robert Collins
Basic two pass iter_all_entries.
696
            set(index.iter_all_entries()))
697
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
698
    def test_iter_entries_buffers_once(self):
699
        index = self.make_index(nodes=self.make_nodes(2))
700
        # reset the transport log
701
        del index._transport._activity[:]
702
        self.assertEqual(set([(index, self.make_key(1), self.make_value(1))]),
703
                         set(index.iter_entries([self.make_key(1)])))
704
        # We should have requested reading the header bytes
705
        # But not needed any more than that because it would have triggered a
706
        # buffer all
707
        self.assertEqual([
708
            ('readv', 'index', [(0, 200)], True, index._size),
709
            ],
710
            index._transport._activity)
711
        # And that should have been enough to trigger reading the whole index
712
        # with buffering
713
        self.assertIsNot(None, index._nodes)
714
3665.3.3 by John Arbash Meinel
If we read more than 50% of the whole index,
715
    def test_iter_entries_buffers_by_bytes_read(self):
716
        index = self.make_index(nodes=self.make_nodes(64))
717
        list(index.iter_entries([self.make_key(10)]))
718
        # The first time through isn't enough to trigger a buffer all
719
        self.assertIs(None, index._nodes)
720
        self.assertEqual(4096, index._bytes_read)
721
        # Grabbing a key in that same page won't trigger a buffer all, as we
722
        # still haven't read 50% of the file
723
        list(index.iter_entries([self.make_key(11)]))
724
        self.assertIs(None, index._nodes)
725
        self.assertEqual(4096, index._bytes_read)
726
        # We haven't read more data, so reading outside the range won't trigger
727
        # a buffer all right away
728
        list(index.iter_entries([self.make_key(40)]))
729
        self.assertIs(None, index._nodes)
730
        self.assertEqual(8192, index._bytes_read)
3665.3.5 by John Arbash Meinel
Move the point at which we 'buffer_all' if we've read >50% of the index.
731
        # On the next pass, we will not trigger buffer all if the key is
732
        # available without reading more
3665.3.3 by John Arbash Meinel
If we read more than 50% of the whole index,
733
        list(index.iter_entries([self.make_key(32)]))
3665.3.5 by John Arbash Meinel
Move the point at which we 'buffer_all' if we've read >50% of the index.
734
        self.assertIs(None, index._nodes)
735
        # But if we *would* need to read more to resolve it, then we will
736
        # buffer all.
737
        list(index.iter_entries([self.make_key(60)]))
3665.3.3 by John Arbash Meinel
If we read more than 50% of the whole index,
738
        self.assertIsNot(None, index._nodes)
739
2890.2.10 by Robert Collins
Add test coverage to ensure \r's are not mangled by bisection parsing.
740
    def test_iter_entries_references_resolved(self):
741
        index = self.make_index(1, nodes=[
742
            (('name', ), 'data', ([('ref', ), ('ref', )], )),
743
            (('ref', ), 'refdata', ([], ))])
744
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),('ref',)),)),
745
            (index, ('ref', ), 'refdata', ((), ))]),
746
            set(index.iter_entries([('name',), ('ref',)])))
747
748
    def test_iter_entries_references_2_refs_resolved(self):
749
        index = self.make_index(2, nodes=[
750
            (('name', ), 'data', ([('ref', )], [('ref', )])),
751
            (('ref', ), 'refdata', ([], []))])
752
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),), (('ref',),))),
753
            (index, ('ref', ), 'refdata', ((), ()))]),
754
            set(index.iter_entries([('name',), ('ref',)])))
755
2592.1.30 by Robert Collins
Absent entries are not yeilded.
756
    def test_iteration_absent_skipped(self):
757
        index = self.make_index(1, nodes=[
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
758
            (('name', ), 'data', ([('ref', )], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
759
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),),))]),
2592.1.30 by Robert Collins
Absent entries are not yeilded.
760
            set(index.iter_all_entries()))
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
761
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),),))]),
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
762
            set(index.iter_entries([('name', )])))
763
        self.assertEqual([], list(index.iter_entries([('ref', )])))
2592.1.30 by Robert Collins
Absent entries are not yeilded.
764
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
765
    def test_iteration_absent_skipped_2_element_keys(self):
766
        index = self.make_index(1, key_elements=2, nodes=[
767
            (('name', 'fin'), 'data', ([('ref', 'erence')], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
768
        self.assertEqual(set([(index, ('name', 'fin'), 'data', ((('ref', 'erence'),),))]),
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
769
            set(index.iter_all_entries()))
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
770
        self.assertEqual(set([(index, ('name', 'fin'), 'data', ((('ref', 'erence'),),))]),
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
771
            set(index.iter_entries([('name', 'fin')])))
772
        self.assertEqual([], list(index.iter_entries([('ref', 'erence')])))
773
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
774
    def test_iter_all_keys(self):
2592.1.29 by Robert Collins
Basic iter_entries working.
775
        index = self.make_index(1, nodes=[
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
776
            (('name', ), 'data', ([('ref', )], )),
777
            (('ref', ), 'refdata', ([], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
778
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),),)),
779
            (index, ('ref', ), 'refdata', ((), ))]),
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
780
            set(index.iter_entries([('name', ), ('ref', )])))
2592.1.29 by Robert Collins
Basic iter_entries working.
781
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
782
    def test_iter_nothing_empty(self):
2592.1.9 by Robert Collins
Iterating no keys should work too.
783
        index = self.make_index()
784
        self.assertEqual([], list(index.iter_entries([])))
785
2592.1.5 by Robert Collins
Trivial index reading.
786
    def test_iter_missing_entry_empty(self):
787
        index = self.make_index()
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
788
        self.assertEqual([], list(index.iter_entries([('a', )])))
2592.1.7 by Robert Collins
A validate that goes boom.
789
2890.2.8 by Robert Collins
Make the size of the index optionally None for the pack-names index.
790
    def test_iter_missing_entry_empty_no_size(self):
791
        index = self.make_index()
792
        index = GraphIndex(index._transport, 'index', None)
793
        self.assertEqual([], list(index.iter_entries([('a', )])))
794
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
795
    def test_iter_key_prefix_1_element_key_None(self):
796
        index = self.make_index()
797
        self.assertRaises(errors.BadIndexKey, list,
798
            index.iter_entries_prefix([(None, )]))
799
800
    def test_iter_key_prefix_wrong_length(self):
801
        index = self.make_index()
802
        self.assertRaises(errors.BadIndexKey, list,
803
            index.iter_entries_prefix([('foo', None)]))
804
        index = self.make_index(key_elements=2)
805
        self.assertRaises(errors.BadIndexKey, list,
806
            index.iter_entries_prefix([('foo', )]))
807
        self.assertRaises(errors.BadIndexKey, list,
808
            index.iter_entries_prefix([('foo', None, None)]))
809
810
    def test_iter_key_prefix_1_key_element_no_refs(self):
811
        index = self.make_index( nodes=[
812
            (('name', ), 'data', ()),
813
            (('ref', ), 'refdata', ())])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
814
        self.assertEqual(set([(index, ('name', ), 'data'),
815
            (index, ('ref', ), 'refdata')]),
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
816
            set(index.iter_entries_prefix([('name', ), ('ref', )])))
817
818
    def test_iter_key_prefix_1_key_element_refs(self):
819
        index = self.make_index(1, nodes=[
820
            (('name', ), 'data', ([('ref', )], )),
821
            (('ref', ), 'refdata', ([], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
822
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),),)),
823
            (index, ('ref', ), 'refdata', ((), ))]),
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
824
            set(index.iter_entries_prefix([('name', ), ('ref', )])))
825
826
    def test_iter_key_prefix_2_key_element_no_refs(self):
827
        index = self.make_index(key_elements=2, nodes=[
828
            (('name', 'fin1'), 'data', ()),
829
            (('name', 'fin2'), 'beta', ()),
830
            (('ref', 'erence'), 'refdata', ())])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
831
        self.assertEqual(set([(index, ('name', 'fin1'), 'data'),
832
            (index, ('ref', 'erence'), 'refdata')]),
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
833
            set(index.iter_entries_prefix([('name', 'fin1'), ('ref', 'erence')])))
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
834
        self.assertEqual(set([(index, ('name', 'fin1'), 'data'),
835
            (index, ('name', 'fin2'), 'beta')]),
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
836
            set(index.iter_entries_prefix([('name', None)])))
837
838
    def test_iter_key_prefix_2_key_element_refs(self):
839
        index = self.make_index(1, key_elements=2, nodes=[
840
            (('name', 'fin1'), 'data', ([('ref', 'erence')], )),
841
            (('name', 'fin2'), 'beta', ([], )),
842
            (('ref', 'erence'), 'refdata', ([], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
843
        self.assertEqual(set([(index, ('name', 'fin1'), 'data', ((('ref', 'erence'),),)),
844
            (index, ('ref', 'erence'), 'refdata', ((), ))]),
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
845
            set(index.iter_entries_prefix([('name', 'fin1'), ('ref', 'erence')])))
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
846
        self.assertEqual(set([(index, ('name', 'fin1'), 'data', ((('ref', 'erence'),),)),
847
            (index, ('name', 'fin2'), 'beta', ((), ))]),
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
848
            set(index.iter_entries_prefix([('name', None)])))
849
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
850
    def test_key_count_empty(self):
851
        index = self.make_index()
852
        self.assertEqual(0, index.key_count())
853
854
    def test_key_count_one(self):
855
        index = self.make_index(nodes=[(('name', ), '', ())])
856
        self.assertEqual(1, index.key_count())
857
858
    def test_key_count_two(self):
859
        index = self.make_index(nodes=[
860
            (('name', ), '', ()), (('foo', ), '', ())])
861
        self.assertEqual(2, index.key_count())
862
3665.3.3 by John Arbash Meinel
If we read more than 50% of the whole index,
863
    def test_read_and_parse_tracks_real_read_value(self):
864
        index = self.make_index(nodes=self.make_nodes(10))
865
        del index._transport._activity[:]
866
        index._read_and_parse([(0, 200)])
867
        self.assertEqual([
868
            ('readv', 'index', [(0, 200)], True, index._size),
869
            ],
870
            index._transport._activity)
871
        # The readv expansion code will expand the initial request to 4096
872
        # bytes, which is more than enough to read the entire index, and we
873
        # will track the fact that we read that many bytes.
874
        self.assertEqual(index._size, index._bytes_read)
875
876
    def test_read_and_parse_triggers_buffer_all(self):
3665.3.1 by John Arbash Meinel
Updates to GraphIndex processing.
877
        index = self.make_index(key_elements=2, nodes=[
878
            (('name', 'fin1'), 'data', ()),
879
            (('name', 'fin2'), 'beta', ()),
880
            (('ref', 'erence'), 'refdata', ())])
881
        self.assertTrue(index._size > 0)
882
        self.assertIs(None, index._nodes)
883
        index._read_and_parse([(0, index._size)])
884
        self.assertIsNot(None, index._nodes)
885
2592.1.7 by Robert Collins
A validate that goes boom.
886
    def test_validate_bad_index_errors(self):
887
        trans = self.get_transport()
888
        trans.put_bytes('name', "not an index\n")
2890.2.1 by Robert Collins
* ``bzrlib.index.GraphIndex`` now requires a size parameter to the
889
        index = GraphIndex(trans, 'name', 13)
2592.1.7 by Robert Collins
A validate that goes boom.
890
        self.assertRaises(errors.BadIndexFormatSignature, index.validate)
2592.1.8 by Robert Collins
Empty files should validate ok.
891
2592.1.10 by Robert Collins
Make validate detect node reference parsing errors.
892
    def test_validate_bad_node_refs(self):
893
        index = self.make_index(2)
894
        trans = self.get_transport()
895
        content = trans.get_bytes('index')
896
        # change the options line to end with a rather than a parseable number
897
        new_content = content[:-2] + 'a\n\n'
898
        trans.put_bytes('index', new_content)
899
        self.assertRaises(errors.BadIndexOptions, index.validate)
900
2592.1.27 by Robert Collins
Test missing end lines with non-empty indices.
901
    def test_validate_missing_end_line_empty(self):
2592.1.11 by Robert Collins
Detect truncated indices.
902
        index = self.make_index(2)
903
        trans = self.get_transport()
904
        content = trans.get_bytes('index')
905
        # truncate the last byte
906
        trans.put_bytes('index', content[:-1])
907
        self.assertRaises(errors.BadIndexData, index.validate)
908
2592.1.27 by Robert Collins
Test missing end lines with non-empty indices.
909
    def test_validate_missing_end_line_nonempty(self):
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
910
        index = self.make_index(2, nodes=[(('key', ), '', ([], []))])
2592.1.27 by Robert Collins
Test missing end lines with non-empty indices.
911
        trans = self.get_transport()
912
        content = trans.get_bytes('index')
913
        # truncate the last byte
914
        trans.put_bytes('index', content[:-1])
915
        self.assertRaises(errors.BadIndexData, index.validate)
916
2592.1.8 by Robert Collins
Empty files should validate ok.
917
    def test_validate_empty(self):
918
        index = self.make_index()
919
        index.validate()
2592.1.12 by Robert Collins
Handle basic node adds.
920
921
    def test_validate_no_refs_content(self):
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
922
        index = self.make_index(nodes=[(('key', ), 'value', ())])
2592.1.12 by Robert Collins
Handle basic node adds.
923
        index.validate()
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
924
4011.5.3 by Andrew Bennetts
Implement and test external_references on GraphIndex and BTreeGraphIndex.
925
    # XXX: external_references tests are duplicated in test_btree_index.  We
926
    # probably should have per_graph_index tests...
927
    def test_external_references_no_refs(self):
928
        index = self.make_index(ref_lists=0, nodes=[])
929
        self.assertRaises(ValueError, index.external_references, 0)
930
931
    def test_external_references_no_results(self):
932
        index = self.make_index(ref_lists=1, nodes=[
933
            (('key',), 'value', ([],))])
934
        self.assertEqual(set(), index.external_references(0))
935
936
    def test_external_references_missing_ref(self):
937
        missing_key = ('missing',)
938
        index = self.make_index(ref_lists=1, nodes=[
939
            (('key',), 'value', ([missing_key],))])
940
        self.assertEqual(set([missing_key]), index.external_references(0))
941
942
    def test_external_references_multiple_ref_lists(self):
943
        missing_key = ('missing',)
944
        index = self.make_index(ref_lists=2, nodes=[
945
            (('key',), 'value', ([], [missing_key]))])
946
        self.assertEqual(set([]), index.external_references(0))
947
        self.assertEqual(set([missing_key]), index.external_references(1))
948
949
    def test_external_references_two_records(self):
950
        index = self.make_index(ref_lists=1, nodes=[
951
            (('key-1',), 'value', ([('key-2',)],)),
952
            (('key-2',), 'value', ([],)),
953
            ])
954
        self.assertEqual(set([]), index.external_references(0))
955
956
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
957
class TestCombinedGraphIndex(TestCaseWithMemoryTransport):
958
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
959
    def make_index(self, name, ref_lists=0, key_elements=1, nodes=[]):
960
        builder = GraphIndexBuilder(ref_lists, key_elements=key_elements)
2624.2.17 by Robert Collins
Review feedback.
961
        for key, value, references in nodes:
962
            builder.add_node(key, value, references)
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
963
        stream = builder.finish()
964
        trans = self.get_transport()
2890.2.1 by Robert Collins
* ``bzrlib.index.GraphIndex`` now requires a size parameter to the
965
        size = trans.put_file(name, stream)
966
        return GraphIndex(trans, name, size)
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
967
3789.1.4 by John Arbash Meinel
CombinedGraphIndex.iter_entries() is now able to reload on request.
968
    def make_combined_index_with_missing(self, missing=['1', '2']):
3789.1.3 by John Arbash Meinel
CombinedGraphIndex can now reload when calling key_count().
969
        """Create a CombinedGraphIndex which will have missing indexes.
970
971
        This creates a CGI which thinks it has 2 indexes, however they have
972
        been deleted. If CGI._reload_func() is called, then it will repopulate
973
        with a new index.
974
3789.1.4 by John Arbash Meinel
CombinedGraphIndex.iter_entries() is now able to reload on request.
975
        :param missing: The underlying indexes to delete
3789.1.3 by John Arbash Meinel
CombinedGraphIndex can now reload when calling key_count().
976
        :return: (CombinedGraphIndex, reload_counter)
977
        """
978
        index1 = self.make_index('1', nodes=[(('1',), '', ())])
979
        index2 = self.make_index('2', nodes=[(('2',), '', ())])
980
        index3 = self.make_index('3', nodes=[
981
            (('1',), '', ()),
982
            (('2',), '', ())])
983
984
        # total_reloads, num_changed, num_unchanged
985
        reload_counter = [0, 0, 0]
986
        def reload():
987
            reload_counter[0] += 1
988
            new_indices = [index3]
989
            if index._indices == new_indices:
990
                reload_counter[2] += 1
991
                return False
992
            reload_counter[1] += 1
993
            index._indices[:] = new_indices
994
            return True
995
        index = CombinedGraphIndex([index1, index2], reload_func=reload)
996
        trans = self.get_transport()
3789.1.4 by John Arbash Meinel
CombinedGraphIndex.iter_entries() is now able to reload on request.
997
        for fname in missing:
998
            trans.delete(fname)
3789.1.3 by John Arbash Meinel
CombinedGraphIndex can now reload when calling key_count().
999
        return index, reload_counter
1000
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1001
    def test_open_missing_index_no_error(self):
1002
        trans = self.get_transport()
2890.2.1 by Robert Collins
* ``bzrlib.index.GraphIndex`` now requires a size parameter to the
1003
        index1 = GraphIndex(trans, 'missing', 100)
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1004
        index = CombinedGraphIndex([index1])
1005
2592.1.37 by Robert Collins
Add CombinedGraphIndex.insert_index.
1006
    def test_add_index(self):
1007
        index = CombinedGraphIndex([])
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1008
        index1 = self.make_index('name', 0, nodes=[(('key', ), '', ())])
2592.1.37 by Robert Collins
Add CombinedGraphIndex.insert_index.
1009
        index.insert_index(0, index1)
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1010
        self.assertEqual([(index1, ('key', ), '')], list(index.iter_all_entries()))
2592.1.37 by Robert Collins
Add CombinedGraphIndex.insert_index.
1011
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1012
    def test_iter_all_entries_empty(self):
1013
        index = CombinedGraphIndex([])
1014
        self.assertEqual([], list(index.iter_all_entries()))
1015
1016
    def test_iter_all_entries_children_empty(self):
1017
        index1 = self.make_index('name')
1018
        index = CombinedGraphIndex([index1])
1019
        self.assertEqual([], list(index.iter_all_entries()))
1020
1021
    def test_iter_all_entries_simple(self):
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1022
        index1 = self.make_index('name', nodes=[(('name', ), 'data', ())])
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1023
        index = CombinedGraphIndex([index1])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1024
        self.assertEqual([(index1, ('name', ), 'data')],
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1025
            list(index.iter_all_entries()))
1026
1027
    def test_iter_all_entries_two_indices(self):
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1028
        index1 = self.make_index('name1', nodes=[(('name', ), 'data', ())])
1029
        index2 = self.make_index('name2', nodes=[(('2', ), '', ())])
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1030
        index = CombinedGraphIndex([index1, index2])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1031
        self.assertEqual([(index1, ('name', ), 'data'),
1032
            (index2, ('2', ), '')],
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1033
            list(index.iter_all_entries()))
1034
2592.1.39 by Robert Collins
CombinedGraphIndex.iter_entries does not need to see all entries.
1035
    def test_iter_entries_two_indices_dup_key(self):
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1036
        index1 = self.make_index('name1', nodes=[(('name', ), 'data', ())])
1037
        index2 = self.make_index('name2', nodes=[(('name', ), 'data', ())])
2592.1.39 by Robert Collins
CombinedGraphIndex.iter_entries does not need to see all entries.
1038
        index = CombinedGraphIndex([index1, index2])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1039
        self.assertEqual([(index1, ('name', ), 'data')],
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1040
            list(index.iter_entries([('name', )])))
2592.1.39 by Robert Collins
CombinedGraphIndex.iter_entries does not need to see all entries.
1041
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1042
    def test_iter_all_entries_two_indices_dup_key(self):
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1043
        index1 = self.make_index('name1', nodes=[(('name', ), 'data', ())])
1044
        index2 = self.make_index('name2', nodes=[(('name', ), 'data', ())])
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1045
        index = CombinedGraphIndex([index1, index2])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1046
        self.assertEqual([(index1, ('name', ), 'data')],
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1047
            list(index.iter_all_entries()))
1048
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
1049
    def test_iter_key_prefix_2_key_element_refs(self):
1050
        index1 = self.make_index('1', 1, key_elements=2, nodes=[
1051
            (('name', 'fin1'), 'data', ([('ref', 'erence')], ))])
1052
        index2 = self.make_index('2', 1, key_elements=2, nodes=[
1053
            (('name', 'fin2'), 'beta', ([], )),
1054
            (('ref', 'erence'), 'refdata', ([], ))])
1055
        index = CombinedGraphIndex([index1, index2])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1056
        self.assertEqual(set([(index1, ('name', 'fin1'), 'data', ((('ref', 'erence'),),)),
1057
            (index2, ('ref', 'erence'), 'refdata', ((), ))]),
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
1058
            set(index.iter_entries_prefix([('name', 'fin1'), ('ref', 'erence')])))
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1059
        self.assertEqual(set([(index1, ('name', 'fin1'), 'data', ((('ref', 'erence'),),)),
1060
            (index2, ('name', 'fin2'), 'beta', ((), ))]),
2624.2.9 by Robert Collins
Introduce multiple component keys, which is what is needed to combine multiple knit indices into one.
1061
            set(index.iter_entries_prefix([('name', None)])))
1062
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1063
    def test_iter_nothing_empty(self):
1064
        index = CombinedGraphIndex([])
1065
        self.assertEqual([], list(index.iter_entries([])))
1066
1067
    def test_iter_nothing_children_empty(self):
1068
        index1 = self.make_index('name')
1069
        index = CombinedGraphIndex([index1])
1070
        self.assertEqual([], list(index.iter_entries([])))
1071
1072
    def test_iter_all_keys(self):
1073
        index1 = self.make_index('1', 1, nodes=[
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1074
            (('name', ), 'data', ([('ref', )], ))])
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1075
        index2 = self.make_index('2', 1, nodes=[
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1076
            (('ref', ), 'refdata', ((), ))])
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1077
        index = CombinedGraphIndex([index1, index2])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1078
        self.assertEqual(set([(index1, ('name', ), 'data', ((('ref', ), ), )),
1079
            (index2, ('ref', ), 'refdata', ((), ))]),
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1080
            set(index.iter_entries([('name', ), ('ref', )])))
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
1081
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1082
    def test_iter_all_keys_dup_entry(self):
1083
        index1 = self.make_index('1', 1, nodes=[
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1084
            (('name', ), 'data', ([('ref', )], )),
1085
            (('ref', ), 'refdata', ([], ))])
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1086
        index2 = self.make_index('2', 1, nodes=[
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1087
            (('ref', ), 'refdata', ([], ))])
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1088
        index = CombinedGraphIndex([index1, index2])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1089
        self.assertEqual(set([(index1, ('name', ), 'data', ((('ref',),),)),
1090
            (index1, ('ref', ), 'refdata', ((), ))]),
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1091
            set(index.iter_entries([('name', ), ('ref', )])))
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
1092
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1093
    def test_iter_missing_entry_empty(self):
1094
        index = CombinedGraphIndex([])
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1095
        self.assertEqual([], list(index.iter_entries([('a', )])))
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1096
1097
    def test_iter_missing_entry_one_index(self):
1098
        index1 = self.make_index('1')
1099
        index = CombinedGraphIndex([index1])
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1100
        self.assertEqual([], list(index.iter_entries([('a', )])))
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1101
1102
    def test_iter_missing_entry_two_index(self):
1103
        index1 = self.make_index('1')
1104
        index2 = self.make_index('2')
1105
        index = CombinedGraphIndex([index1, index2])
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1106
        self.assertEqual([], list(index.iter_entries([('a', )])))
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
1107
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1108
    def test_iter_entry_present_one_index_only(self):
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1109
        index1 = self.make_index('1', nodes=[(('key', ), '', ())])
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1110
        index2 = self.make_index('2', nodes=[])
1111
        index = CombinedGraphIndex([index1, index2])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1112
        self.assertEqual([(index1, ('key', ), '')],
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1113
            list(index.iter_entries([('key', )])))
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1114
        # and in the other direction
1115
        index = CombinedGraphIndex([index2, index1])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1116
        self.assertEqual([(index1, ('key', ), '')],
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1117
            list(index.iter_entries([('key', )])))
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1118
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
1119
    def test_key_count_empty(self):
1120
        index1 = self.make_index('1', nodes=[])
1121
        index2 = self.make_index('2', nodes=[])
1122
        index = CombinedGraphIndex([index1, index2])
1123
        self.assertEqual(0, index.key_count())
1124
1125
    def test_key_count_sums_index_keys(self):
1126
        index1 = self.make_index('1', nodes=[
1127
            (('1',), '', ()),
1128
            (('2',), '', ())])
1129
        index2 = self.make_index('2', nodes=[(('1',), '', ())])
1130
        index = CombinedGraphIndex([index1, index2])
1131
        self.assertEqual(3, index.key_count())
1132
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1133
    def test_validate_bad_child_index_errors(self):
1134
        trans = self.get_transport()
1135
        trans.put_bytes('name', "not an index\n")
2890.2.1 by Robert Collins
* ``bzrlib.index.GraphIndex`` now requires a size parameter to the
1136
        index1 = GraphIndex(trans, 'name', 13)
2592.1.31 by Robert Collins
Build a combined graph index to use multiple indices at once.
1137
        index = CombinedGraphIndex([index1])
1138
        self.assertRaises(errors.BadIndexFormatSignature, index.validate)
1139
1140
    def test_validate_empty(self):
1141
        index = CombinedGraphIndex([])
1142
        index.validate()
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1143
3789.1.3 by John Arbash Meinel
CombinedGraphIndex can now reload when calling key_count().
1144
    def test_key_count_reloads(self):
3789.1.4 by John Arbash Meinel
CombinedGraphIndex.iter_entries() is now able to reload on request.
1145
        index, reload_counter = self.make_combined_index_with_missing()
3789.1.3 by John Arbash Meinel
CombinedGraphIndex can now reload when calling key_count().
1146
        self.assertEqual(2, index.key_count())
1147
        self.assertEqual([1, 1, 0], reload_counter)
1148
3789.1.4 by John Arbash Meinel
CombinedGraphIndex.iter_entries() is now able to reload on request.
1149
    def test_key_count_no_reload(self):
1150
        index, reload_counter = self.make_combined_index_with_missing()
1151
        index._reload_func = None
1152
        # Without a _reload_func we just raise the exception
1153
        self.assertRaises(errors.NoSuchFile, index.key_count)
1154
3789.1.3 by John Arbash Meinel
CombinedGraphIndex can now reload when calling key_count().
1155
    def test_key_count_reloads_and_fails(self):
3789.1.4 by John Arbash Meinel
CombinedGraphIndex.iter_entries() is now able to reload on request.
1156
        # We have deleted all underlying indexes, so we will try to reload, but
3789.1.3 by John Arbash Meinel
CombinedGraphIndex can now reload when calling key_count().
1157
        # still fail. This is mostly to test we don't get stuck in an infinite
1158
        # loop trying to reload
3789.1.4 by John Arbash Meinel
CombinedGraphIndex.iter_entries() is now able to reload on request.
1159
        index, reload_counter = self.make_combined_index_with_missing(
1160
                                    ['1', '2', '3'])
3789.1.3 by John Arbash Meinel
CombinedGraphIndex can now reload when calling key_count().
1161
        self.assertRaises(errors.NoSuchFile, index.key_count)
1162
        self.assertEqual([2, 1, 1], reload_counter)
1163
3789.1.4 by John Arbash Meinel
CombinedGraphIndex.iter_entries() is now able to reload on request.
1164
    def test_iter_entries_reloads(self):
1165
        index, reload_counter = self.make_combined_index_with_missing()
1166
        result = list(index.iter_entries([('1',), ('2',), ('3',)]))
1167
        index3 = index._indices[0]
1168
        self.assertEqual([(index3, ('1',), ''), (index3, ('2',), '')],
1169
                         result)
1170
        self.assertEqual([1, 1, 0], reload_counter)
1171
1172
    def test_iter_entries_reloads_midway(self):
1173
        # The first index still looks present, so we get interrupted mid-way
1174
        # through
1175
        index, reload_counter = self.make_combined_index_with_missing(['2'])
1176
        index1, index2 = index._indices
1177
        result = list(index.iter_entries([('1',), ('2',), ('3',)]))
1178
        index3 = index._indices[0]
3789.1.5 by John Arbash Meinel
CombinedGraphIndex.iter_all_entries() can now reload when needed.
1179
        # We had already yielded '1', so we just go on to the next, we should
3789.1.6 by John Arbash Meinel
CombinedGraphIndex.iter_entries_prefix can now reload when needed.
1180
        # not yield '1' twice.
3789.1.4 by John Arbash Meinel
CombinedGraphIndex.iter_entries() is now able to reload on request.
1181
        self.assertEqual([(index1, ('1',), ''), (index3, ('2',), '')],
1182
                         result)
1183
        self.assertEqual([1, 1, 0], reload_counter)
1184
1185
    def test_iter_entries_no_reload(self):
1186
        index, reload_counter = self.make_combined_index_with_missing()
1187
        index._reload_func = None
1188
        # Without a _reload_func we just raise the exception
1189
        self.assertListRaises(errors.NoSuchFile, index.iter_entries, [('3',)])
1190
1191
    def test_iter_entries_reloads_and_fails(self):
1192
        index, reload_counter = self.make_combined_index_with_missing(
1193
                                    ['1', '2', '3'])
1194
        self.assertListRaises(errors.NoSuchFile, index.iter_entries, [('3',)])
1195
        self.assertEqual([2, 1, 1], reload_counter)
1196
3789.1.5 by John Arbash Meinel
CombinedGraphIndex.iter_all_entries() can now reload when needed.
1197
    def test_iter_all_entries_reloads(self):
1198
        index, reload_counter = self.make_combined_index_with_missing()
1199
        result = list(index.iter_all_entries())
1200
        index3 = index._indices[0]
1201
        self.assertEqual([(index3, ('1',), ''), (index3, ('2',), '')],
1202
                         result)
1203
        self.assertEqual([1, 1, 0], reload_counter)
1204
1205
    def test_iter_all_entries_reloads_midway(self):
1206
        index, reload_counter = self.make_combined_index_with_missing(['2'])
1207
        index1, index2 = index._indices
1208
        result = list(index.iter_all_entries())
1209
        index3 = index._indices[0]
1210
        # We had already yielded '1', so we just go on to the next, we should
3789.1.6 by John Arbash Meinel
CombinedGraphIndex.iter_entries_prefix can now reload when needed.
1211
        # not yield '1' twice.
3789.1.5 by John Arbash Meinel
CombinedGraphIndex.iter_all_entries() can now reload when needed.
1212
        self.assertEqual([(index1, ('1',), ''), (index3, ('2',), '')],
1213
                         result)
1214
        self.assertEqual([1, 1, 0], reload_counter)
1215
1216
    def test_iter_all_entries_no_reload(self):
1217
        index, reload_counter = self.make_combined_index_with_missing()
1218
        index._reload_func = None
1219
        self.assertListRaises(errors.NoSuchFile, index.iter_all_entries)
1220
1221
    def test_iter_all_entries_reloads_and_fails(self):
1222
        index, reload_counter = self.make_combined_index_with_missing(
1223
                                    ['1', '2', '3'])
1224
        self.assertListRaises(errors.NoSuchFile, index.iter_all_entries)
3789.1.4 by John Arbash Meinel
CombinedGraphIndex.iter_entries() is now able to reload on request.
1225
3789.1.6 by John Arbash Meinel
CombinedGraphIndex.iter_entries_prefix can now reload when needed.
1226
    def test_iter_entries_prefix_reloads(self):
1227
        index, reload_counter = self.make_combined_index_with_missing()
1228
        result = list(index.iter_entries_prefix([('1',)]))
1229
        index3 = index._indices[0]
1230
        self.assertEqual([(index3, ('1',), '')], result)
1231
        self.assertEqual([1, 1, 0], reload_counter)
1232
1233
    def test_iter_entries_prefix_reloads_midway(self):
1234
        index, reload_counter = self.make_combined_index_with_missing(['2'])
1235
        index1, index2 = index._indices
1236
        result = list(index.iter_entries_prefix([('1',)]))
1237
        index3 = index._indices[0]
1238
        # We had already yielded '1', so we just go on to the next, we should
1239
        # not yield '1' twice.
1240
        self.assertEqual([(index1, ('1',), '')], result)
1241
        self.assertEqual([1, 1, 0], reload_counter)
1242
1243
    def test_iter_entries_prefix_no_reload(self):
1244
        index, reload_counter = self.make_combined_index_with_missing()
1245
        index._reload_func = None
1246
        self.assertListRaises(errors.NoSuchFile, index.iter_entries_prefix,
1247
                                                 [('1',)])
1248
1249
    def test_iter_entries_prefix_reloads_and_fails(self):
1250
        index, reload_counter = self.make_combined_index_with_missing(
1251
                                    ['1', '2', '3'])
1252
        self.assertListRaises(errors.NoSuchFile, index.iter_entries_prefix,
1253
                                                 [('1',)])
1254
3789.1.7 by John Arbash Meinel
CombinedGraphIndex.validate() will now reload.
1255
    def test_validate_reloads(self):
1256
        index, reload_counter = self.make_combined_index_with_missing()
1257
        index.validate()
1258
        self.assertEqual([1, 1, 0], reload_counter)
1259
1260
    def test_validate_reloads_midway(self):
1261
        index, reload_counter = self.make_combined_index_with_missing(['2'])
1262
        index.validate()
1263
1264
    def test_validate_no_reload(self):
1265
        index, reload_counter = self.make_combined_index_with_missing()
1266
        index._reload_func = None
1267
        self.assertRaises(errors.NoSuchFile, index.validate)
1268
1269
    def test_validate_reloads_and_fails(self):
1270
        index, reload_counter = self.make_combined_index_with_missing(
1271
                                    ['1', '2', '3'])
1272
        self.assertRaises(errors.NoSuchFile, index.validate)
1273
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1274
1275
class TestInMemoryGraphIndex(TestCaseWithMemoryTransport):
1276
2624.2.10 by Robert Collins
Also add iter_key_prefix support to InMemoryGraphIndex.
1277
    def make_index(self, ref_lists=0, key_elements=1, nodes=[]):
1278
        result = InMemoryGraphIndex(ref_lists, key_elements=key_elements)
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1279
        result.add_nodes(nodes)
1280
        return result
1281
2624.2.1 by Robert Collins
InMemoryGraphIndex.add_nodes was inconsistent with other metods for non-node-reference indices.
1282
    def test_add_nodes_no_refs(self):
1283
        index = self.make_index(0)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1284
        index.add_nodes([(('name', ), 'data')])
1285
        index.add_nodes([(('name2', ), ''), (('name3', ), '')])
2624.2.1 by Robert Collins
InMemoryGraphIndex.add_nodes was inconsistent with other metods for non-node-reference indices.
1286
        self.assertEqual(set([
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1287
            (index, ('name', ), 'data'),
1288
            (index, ('name2', ), ''),
1289
            (index, ('name3', ), ''),
2624.2.1 by Robert Collins
InMemoryGraphIndex.add_nodes was inconsistent with other metods for non-node-reference indices.
1290
            ]), set(index.iter_all_entries()))
1291
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1292
    def test_add_nodes(self):
1293
        index = self.make_index(1)
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1294
        index.add_nodes([(('name', ), 'data', ([],))])
1295
        index.add_nodes([(('name2', ), '', ([],)), (('name3', ), '', ([('r', )],))])
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1296
        self.assertEqual(set([
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1297
            (index, ('name', ), 'data', ((),)),
1298
            (index, ('name2', ), '', ((),)),
1299
            (index, ('name3', ), '', ((('r', ), ), )),
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1300
            ]), set(index.iter_all_entries()))
1301
1302
    def test_iter_all_entries_empty(self):
1303
        index = self.make_index()
1304
        self.assertEqual([], list(index.iter_all_entries()))
1305
1306
    def test_iter_all_entries_simple(self):
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1307
        index = self.make_index(nodes=[(('name', ), 'data')])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1308
        self.assertEqual([(index, ('name', ), 'data')],
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1309
            list(index.iter_all_entries()))
1310
1311
    def test_iter_all_entries_references(self):
1312
        index = self.make_index(1, nodes=[
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1313
            (('name', ), 'data', ([('ref', )], )),
1314
            (('ref', ), 'refdata', ([], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1315
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref', ),),)),
1316
            (index, ('ref', ), 'refdata', ((), ))]),
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1317
            set(index.iter_all_entries()))
1318
1319
    def test_iteration_absent_skipped(self):
1320
        index = self.make_index(1, nodes=[
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1321
            (('name', ), 'data', ([('ref', )], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1322
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),),))]),
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1323
            set(index.iter_all_entries()))
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1324
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),),))]),
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1325
            set(index.iter_entries([('name', )])))
1326
        self.assertEqual([], list(index.iter_entries([('ref', )])))
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1327
1328
    def test_iter_all_keys(self):
1329
        index = self.make_index(1, nodes=[
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1330
            (('name', ), 'data', ([('ref', )], )),
1331
            (('ref', ), 'refdata', ([], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1332
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),),)),
1333
            (index, ('ref', ), 'refdata', ((), ))]),
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1334
            set(index.iter_entries([('name', ), ('ref', )])))
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1335
2624.2.10 by Robert Collins
Also add iter_key_prefix support to InMemoryGraphIndex.
1336
    def test_iter_key_prefix_1_key_element_no_refs(self):
1337
        index = self.make_index( nodes=[
1338
            (('name', ), 'data'),
1339
            (('ref', ), 'refdata')])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1340
        self.assertEqual(set([(index, ('name', ), 'data'),
1341
            (index, ('ref', ), 'refdata')]),
2624.2.10 by Robert Collins
Also add iter_key_prefix support to InMemoryGraphIndex.
1342
            set(index.iter_entries_prefix([('name', ), ('ref', )])))
1343
1344
    def test_iter_key_prefix_1_key_element_refs(self):
1345
        index = self.make_index(1, nodes=[
1346
            (('name', ), 'data', ([('ref', )], )),
1347
            (('ref', ), 'refdata', ([], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1348
        self.assertEqual(set([(index, ('name', ), 'data', ((('ref',),),)),
1349
            (index, ('ref', ), 'refdata', ((), ))]),
2624.2.10 by Robert Collins
Also add iter_key_prefix support to InMemoryGraphIndex.
1350
            set(index.iter_entries_prefix([('name', ), ('ref', )])))
1351
1352
    def test_iter_key_prefix_2_key_element_no_refs(self):
1353
        index = self.make_index(key_elements=2, nodes=[
1354
            (('name', 'fin1'), 'data'),
1355
            (('name', 'fin2'), 'beta'),
1356
            (('ref', 'erence'), 'refdata')])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1357
        self.assertEqual(set([(index, ('name', 'fin1'), 'data'),
1358
            (index, ('ref', 'erence'), 'refdata')]),
2624.2.10 by Robert Collins
Also add iter_key_prefix support to InMemoryGraphIndex.
1359
            set(index.iter_entries_prefix([('name', 'fin1'), ('ref', 'erence')])))
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1360
        self.assertEqual(set([(index, ('name', 'fin1'), 'data'),
1361
            (index, ('name', 'fin2'), 'beta')]),
2624.2.10 by Robert Collins
Also add iter_key_prefix support to InMemoryGraphIndex.
1362
            set(index.iter_entries_prefix([('name', None)])))
1363
1364
    def test_iter_key_prefix_2_key_element_refs(self):
1365
        index = self.make_index(1, key_elements=2, nodes=[
1366
            (('name', 'fin1'), 'data', ([('ref', 'erence')], )),
1367
            (('name', 'fin2'), 'beta', ([], )),
1368
            (('ref', 'erence'), 'refdata', ([], ))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1369
        self.assertEqual(set([(index, ('name', 'fin1'), 'data', ((('ref', 'erence'),),)),
1370
            (index, ('ref', 'erence'), 'refdata', ((), ))]),
2624.2.10 by Robert Collins
Also add iter_key_prefix support to InMemoryGraphIndex.
1371
            set(index.iter_entries_prefix([('name', 'fin1'), ('ref', 'erence')])))
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1372
        self.assertEqual(set([(index, ('name', 'fin1'), 'data', ((('ref', 'erence'),),)),
1373
            (index, ('name', 'fin2'), 'beta', ((), ))]),
2624.2.10 by Robert Collins
Also add iter_key_prefix support to InMemoryGraphIndex.
1374
            set(index.iter_entries_prefix([('name', None)])))
1375
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1376
    def test_iter_nothing_empty(self):
1377
        index = self.make_index()
1378
        self.assertEqual([], list(index.iter_entries([])))
1379
1380
    def test_iter_missing_entry_empty(self):
1381
        index = self.make_index()
1382
        self.assertEqual([], list(index.iter_entries(['a'])))
1383
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
1384
    def test_key_count_empty(self):
1385
        index = self.make_index()
1386
        self.assertEqual(0, index.key_count())
1387
1388
    def test_key_count_one(self):
1389
        index = self.make_index(nodes=[(('name', ), '')])
1390
        self.assertEqual(1, index.key_count())
1391
1392
    def test_key_count_two(self):
1393
        index = self.make_index(nodes=[(('name', ), ''), (('foo', ), '')])
1394
        self.assertEqual(2, index.key_count())
1395
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1396
    def test_validate_empty(self):
1397
        index = self.make_index()
1398
        index.validate()
1399
1400
    def test_validate_no_refs_content(self):
2624.2.5 by Robert Collins
Change bzrlib.index.Index keys to be 1-tuples, not strings.
1401
        index = self.make_index(nodes=[(('key', ), 'value')])
2592.1.38 by Robert Collins
Create an InMemoryGraphIndex for temporary indexing.
1402
        index.validate()
1403
1404
2624.2.12 by Robert Collins
Create an adapter between indices with differing key lengths.
1405
class TestGraphIndexPrefixAdapter(TestCaseWithMemoryTransport):
1406
2624.2.13 by Robert Collins
Implement add_node/add_nodes to the GraphIndexPrefixAdapter.
1407
    def make_index(self, ref_lists=1, key_elements=2, nodes=[], add_callback=False):
2624.2.12 by Robert Collins
Create an adapter between indices with differing key lengths.
1408
        result = InMemoryGraphIndex(ref_lists, key_elements=key_elements)
1409
        result.add_nodes(nodes)
2624.2.13 by Robert Collins
Implement add_node/add_nodes to the GraphIndexPrefixAdapter.
1410
        if add_callback:
2624.2.17 by Robert Collins
Review feedback.
1411
            add_nodes_callback = result.add_nodes
2624.2.13 by Robert Collins
Implement add_node/add_nodes to the GraphIndexPrefixAdapter.
1412
        else:
2624.2.17 by Robert Collins
Review feedback.
1413
            add_nodes_callback = None
2624.2.13 by Robert Collins
Implement add_node/add_nodes to the GraphIndexPrefixAdapter.
1414
        adapter = GraphIndexPrefixAdapter(result, ('prefix', ), key_elements - 1,
1415
            add_nodes_callback=add_nodes_callback)
2624.2.12 by Robert Collins
Create an adapter between indices with differing key lengths.
1416
        return result, adapter
1417
2624.2.13 by Robert Collins
Implement add_node/add_nodes to the GraphIndexPrefixAdapter.
1418
    def test_add_node(self):
1419
        index, adapter = self.make_index(add_callback=True)
1420
        adapter.add_node(('key',), 'value', ((('ref',),),))
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1421
        self.assertEqual(set([(index, ('prefix', 'key'), 'value', ((('prefix', 'ref'),),))]),
2624.2.13 by Robert Collins
Implement add_node/add_nodes to the GraphIndexPrefixAdapter.
1422
            set(index.iter_all_entries()))
1423
1424
    def test_add_nodes(self):
1425
        index, adapter = self.make_index(add_callback=True)
1426
        adapter.add_nodes((
1427
            (('key',), 'value', ((('ref',),),)),
1428
            (('key2',), 'value2', ((),)),
1429
            ))
1430
        self.assertEqual(set([
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1431
            (index, ('prefix', 'key2'), 'value2', ((),)),
1432
            (index, ('prefix', 'key'), 'value', ((('prefix', 'ref'),),))
2624.2.13 by Robert Collins
Implement add_node/add_nodes to the GraphIndexPrefixAdapter.
1433
            ]),
1434
            set(index.iter_all_entries()))
1435
2624.2.12 by Robert Collins
Create an adapter between indices with differing key lengths.
1436
    def test_construct(self):
1437
        index = InMemoryGraphIndex()
1438
        adapter = GraphIndexPrefixAdapter(index, ('prefix', ), 1)
1439
1440
    def test_construct_with_callback(self):
1441
        index = InMemoryGraphIndex()
1442
        adapter = GraphIndexPrefixAdapter(index, ('prefix', ), 1, index.add_nodes)
1443
1444
    def test_iter_all_entries_cross_prefix_map_errors(self):
1445
        index, adapter = self.make_index(nodes=[
1446
            (('prefix', 'key1'), 'data1', ((('prefixaltered', 'key2'),),))])
1447
        self.assertRaises(errors.BadIndexData, list, adapter.iter_all_entries())
1448
1449
    def test_iter_all_entries(self):
1450
        index, adapter = self.make_index(nodes=[
1451
            (('notprefix', 'key1'), 'data', ((), )),
1452
            (('prefix', 'key1'), 'data1', ((), )),
1453
            (('prefix', 'key2'), 'data2', ((('prefix', 'key1'),),))])
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1454
        self.assertEqual(set([(index, ('key1', ), 'data1', ((),)),
1455
            (index, ('key2', ), 'data2', ((('key1',),),))]),
2624.2.12 by Robert Collins
Create an adapter between indices with differing key lengths.
1456
            set(adapter.iter_all_entries()))
1457
1458
    def test_iter_entries(self):
1459
        index, adapter = self.make_index(nodes=[
1460
            (('notprefix', 'key1'), 'data', ((), )),
1461
            (('prefix', 'key1'), 'data1', ((), )),
1462
            (('prefix', 'key2'), 'data2', ((('prefix', 'key1'),),))])
1463
        # ask for many - get all
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1464
        self.assertEqual(set([(index, ('key1', ), 'data1', ((),)),
1465
            (index, ('key2', ), 'data2', ((('key1', ),),))]),
2624.2.12 by Robert Collins
Create an adapter between indices with differing key lengths.
1466
            set(adapter.iter_entries([('key1', ), ('key2', )])))
1467
        # ask for one, get one
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1468
        self.assertEqual(set([(index, ('key1', ), 'data1', ((),))]),
2624.2.12 by Robert Collins
Create an adapter between indices with differing key lengths.
1469
            set(adapter.iter_entries([('key1', )])))
1470
        # ask for missing, get none
1471
        self.assertEqual(set(),
1472
            set(adapter.iter_entries([('key3', )])))
1473
1474
    def test_iter_entries_prefix(self):
1475
        index, adapter = self.make_index(key_elements=3, nodes=[
1476
            (('notprefix', 'foo', 'key1'), 'data', ((), )),
1477
            (('prefix', 'prefix2', 'key1'), 'data1', ((), )),
1478
            (('prefix', 'prefix2', 'key2'), 'data2', ((('prefix', 'prefix2', 'key1'),),))])
1479
        # ask for a prefix, get the results for just that prefix, adjusted.
2624.2.14 by Robert Collins
Add source index to the index iteration API to allow mapping back to the origin of retrieved data.
1480
        self.assertEqual(set([(index, ('prefix2', 'key1', ), 'data1', ((),)),
1481
            (index, ('prefix2', 'key2', ), 'data2', ((('prefix2', 'key1', ),),))]),
2624.2.12 by Robert Collins
Create an adapter between indices with differing key lengths.
1482
            set(adapter.iter_entries_prefix([('prefix2', None)])))
1483
2624.2.16 by Robert Collins
Add a key_count method to GraphIndex and friends, allowing optimisation of length calculations by the index.
1484
    def test_key_count_no_matching_keys(self):
1485
        index, adapter = self.make_index(nodes=[
1486
            (('notprefix', 'key1'), 'data', ((), ))])
1487
        self.assertEqual(0, adapter.key_count())
1488
1489
    def test_key_count_some_keys(self):
1490
        index, adapter = self.make_index(nodes=[
1491
            (('notprefix', 'key1'), 'data', ((), )),
1492
            (('prefix', 'key1'), 'data1', ((), )),
1493
            (('prefix', 'key2'), 'data2', ((('prefix', 'key1'),),))])
1494
        self.assertEqual(2, adapter.key_count())
1495
2624.2.12 by Robert Collins
Create an adapter between indices with differing key lengths.
1496
    def test_validate(self):
1497
        index, adapter = self.make_index()
1498
        calls = []
1499
        def validate():
1500
            calls.append('called')
1501
        index.validate = validate
1502
        adapter.validate()
1503
        self.assertEqual(['called'], calls)