/brz/remove-bazaar

To get this branch, use:
bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/tests/test_repository.py

  • Committer: Canonical.com Patch Queue Manager
  • Date: 2008-01-11 05:08:20 UTC
  • mfrom: (2535.4.31 streaming-smart-fetch)
  • Revision ID: pqm@pqm.ubuntu.com-20080111050820-eendmy6xgfc6w0yc
(andrew) Add Smart request that can stream revisions without
        buffering.

Show diffs side-by-side

added added

removed removed

Lines of Context:
1
 
# Copyright (C) 2006-2010 Canonical Ltd
 
1
# Copyright (C) 2006, 2007 Canonical Ltd
2
2
#
3
3
# This program is free software; you can redistribute it and/or modify
4
4
# it under the terms of the GNU General Public License as published by
12
12
#
13
13
# You should have received a copy of the GNU General Public License
14
14
# along with this program; if not, write to the Free Software
15
 
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
16
 
17
17
"""Tests for the Repository facility that are not interface tests.
18
18
 
19
 
For interface tests see tests/per_repository/*.py.
 
19
For interface tests see tests/repository_implementations/*.py.
20
20
 
21
21
For concrete class tests see this file, and for storage formats tests
22
22
also see this file.
23
23
"""
24
24
 
 
25
import md5
25
26
from stat import S_ISDIR
26
 
import sys
 
27
from StringIO import StringIO
27
28
 
28
29
import bzrlib
29
 
from bzrlib.errors import (NoSuchFile,
 
30
from bzrlib.errors import (NotBranchError,
 
31
                           NoSuchFile,
30
32
                           UnknownFormatError,
31
33
                           UnsupportedFormatError,
32
34
                           )
33
 
from bzrlib import (
34
 
    graph,
35
 
    tests,
36
 
    )
37
 
from bzrlib.btree_index import BTreeBuilder, BTreeGraphIndex
38
 
from bzrlib.index import GraphIndex
 
35
from bzrlib.index import GraphIndex, InMemoryGraphIndex
39
36
from bzrlib.repository import RepositoryFormat
 
37
from bzrlib.smart import server
40
38
from bzrlib.tests import (
41
39
    TestCase,
42
40
    TestCaseWithTransport,
43
 
    )
44
 
from bzrlib.transport import (
45
 
    get_transport,
46
 
    )
 
41
    test_knit,
 
42
    )
 
43
from bzrlib.transport import get_transport
 
44
from bzrlib.transport.memory import MemoryServer
 
45
from bzrlib.util import bencode
47
46
from bzrlib import (
48
47
    bzrdir,
49
48
    errors,
50
49
    inventory,
51
 
    osutils,
 
50
    progress,
52
51
    repository,
53
52
    revision as _mod_revision,
 
53
    symbol_versioning,
54
54
    upgrade,
55
 
    versionedfile,
56
55
    workingtree,
57
56
    )
58
 
from bzrlib.repofmt import (
59
 
    groupcompress_repo,
60
 
    knitrepo,
61
 
    pack_repo,
62
 
    weaverepo,
63
 
    )
 
57
from bzrlib.repofmt import knitrepo, weaverepo, pack_repo
64
58
 
65
59
 
66
60
class TestDefaultFormat(TestCase):
95
89
class SampleRepositoryFormat(repository.RepositoryFormat):
96
90
    """A sample format
97
91
 
98
 
    this format is initializable, unsupported to aid in testing the
 
92
    this format is initializable, unsupported to aid in testing the 
99
93
    open and open(unsupported=True) routines.
100
94
    """
101
95
 
122
116
    def test_find_format(self):
123
117
        # is the right format object found for a repository?
124
118
        # create a branch with a few known format objects.
125
 
        # this is not quite the same as
 
119
        # this is not quite the same as 
126
120
        self.build_tree(["foo/", "bar/"])
127
121
        def check_format(format, url):
128
122
            dir = format._matchingbzrdir.initialize(url)
131
125
            found_format = repository.RepositoryFormat.find_format(dir)
132
126
            self.failUnless(isinstance(found_format, format.__class__))
133
127
        check_format(weaverepo.RepositoryFormat7(), "bar")
134
 
 
 
128
        
135
129
    def test_find_format_no_repository(self):
136
130
        dir = bzrdir.BzrDirMetaFormat1().initialize(self.get_url())
137
131
        self.assertRaises(errors.NoRepositoryPresent,
163
157
 
164
158
class TestFormat6(TestCaseWithTransport):
165
159
 
166
 
    def test_attribute__fetch_order(self):
167
 
        """Weaves need topological data insertion."""
168
 
        control = bzrdir.BzrDirFormat6().initialize(self.get_url())
169
 
        repo = weaverepo.RepositoryFormat6().initialize(control)
170
 
        self.assertEqual('topological', repo._format._fetch_order)
171
 
 
172
 
    def test_attribute__fetch_uses_deltas(self):
173
 
        """Weaves do not reuse deltas."""
174
 
        control = bzrdir.BzrDirFormat6().initialize(self.get_url())
175
 
        repo = weaverepo.RepositoryFormat6().initialize(control)
176
 
        self.assertEqual(False, repo._format._fetch_uses_deltas)
177
 
 
178
 
    def test_attribute__fetch_reconcile(self):
179
 
        """Weave repositories need a reconcile after fetch."""
180
 
        control = bzrdir.BzrDirFormat6().initialize(self.get_url())
181
 
        repo = weaverepo.RepositoryFormat6().initialize(control)
182
 
        self.assertEqual(True, repo._format._fetch_reconcile)
183
 
 
184
160
    def test_no_ancestry_weave(self):
185
161
        control = bzrdir.BzrDirFormat6().initialize(self.get_url())
186
162
        repo = weaverepo.RepositoryFormat6().initialize(control)
190
166
                          control.transport.get,
191
167
                          'ancestry.weave')
192
168
 
193
 
    def test_supports_external_lookups(self):
 
169
    def test_exposed_versioned_files_are_marked_dirty(self):
194
170
        control = bzrdir.BzrDirFormat6().initialize(self.get_url())
195
171
        repo = weaverepo.RepositoryFormat6().initialize(control)
196
 
        self.assertFalse(repo._format.supports_external_lookups)
 
172
        repo.lock_write()
 
173
        inv = repo.get_inventory_weave()
 
174
        repo.unlock()
 
175
        self.assertRaises(errors.OutSideTransaction,
 
176
            inv.add_lines, 'foo', [], [])
197
177
 
198
178
 
199
179
class TestFormat7(TestCaseWithTransport):
200
 
 
201
 
    def test_attribute__fetch_order(self):
202
 
        """Weaves need topological data insertion."""
203
 
        control = bzrdir.BzrDirMetaFormat1().initialize(self.get_url())
204
 
        repo = weaverepo.RepositoryFormat7().initialize(control)
205
 
        self.assertEqual('topological', repo._format._fetch_order)
206
 
 
207
 
    def test_attribute__fetch_uses_deltas(self):
208
 
        """Weaves do not reuse deltas."""
209
 
        control = bzrdir.BzrDirMetaFormat1().initialize(self.get_url())
210
 
        repo = weaverepo.RepositoryFormat7().initialize(control)
211
 
        self.assertEqual(False, repo._format._fetch_uses_deltas)
212
 
 
213
 
    def test_attribute__fetch_reconcile(self):
214
 
        """Weave repositories need a reconcile after fetch."""
215
 
        control = bzrdir.BzrDirMetaFormat1().initialize(self.get_url())
216
 
        repo = weaverepo.RepositoryFormat7().initialize(control)
217
 
        self.assertEqual(True, repo._format._fetch_reconcile)
218
 
 
 
180
    
219
181
    def test_disk_layout(self):
220
182
        control = bzrdir.BzrDirMetaFormat1().initialize(self.get_url())
221
183
        repo = weaverepo.RepositoryFormat7().initialize(control)
237
199
                             'w\n'
238
200
                             'W\n',
239
201
                             t.get('inventory.weave').read())
240
 
        # Creating a file with id Foo:Bar results in a non-escaped file name on
241
 
        # disk.
242
 
        control.create_branch()
243
 
        tree = control.create_workingtree()
244
 
        tree.add(['foo'], ['Foo:Bar'], ['file'])
245
 
        tree.put_file_bytes_non_atomic('Foo:Bar', 'content\n')
246
 
        try:
247
 
            tree.commit('first post', rev_id='first')
248
 
        except errors.IllegalPath:
249
 
            if sys.platform != 'win32':
250
 
                raise
251
 
            self.knownFailure('Foo:Bar cannot be used as a file-id on windows'
252
 
                              ' in repo format 7')
253
 
            return
254
 
        self.assertEqualDiff(
255
 
            '# bzr weave file v5\n'
256
 
            'i\n'
257
 
            '1 7fe70820e08a1aac0ef224d9c66ab66831cc4ab1\n'
258
 
            'n first\n'
259
 
            '\n'
260
 
            'w\n'
261
 
            '{ 0\n'
262
 
            '. content\n'
263
 
            '}\n'
264
 
            'W\n',
265
 
            t.get('weaves/74/Foo%3ABar.weave').read())
266
202
 
267
203
    def test_shared_disk_layout(self):
268
204
        control = bzrdir.BzrDirMetaFormat1().initialize(self.get_url())
291
227
        control = bzrdir.BzrDirMetaFormat1().initialize(self.get_url())
292
228
        repo = weaverepo.RepositoryFormat7().initialize(control, shared=True)
293
229
        t = control.get_repository_transport(None)
294
 
        # TODO: Should check there is a 'lock' toplevel directory,
 
230
        # TODO: Should check there is a 'lock' toplevel directory, 
295
231
        # regardless of contents
296
232
        self.assertFalse(t.has('lock/held/info'))
297
233
        repo.lock_write()
343
279
                             'W\n',
344
280
                             t.get('inventory.weave').read())
345
281
 
346
 
    def test_supports_external_lookups(self):
 
282
    def test_exposed_versioned_files_are_marked_dirty(self):
347
283
        control = bzrdir.BzrDirMetaFormat1().initialize(self.get_url())
348
284
        repo = weaverepo.RepositoryFormat7().initialize(control)
349
 
        self.assertFalse(repo._format.supports_external_lookups)
 
285
        repo.lock_write()
 
286
        inv = repo.get_inventory_weave()
 
287
        repo.unlock()
 
288
        self.assertRaises(errors.OutSideTransaction,
 
289
            inv.add_lines, 'foo', [], [])
350
290
 
351
291
 
352
292
class TestFormatKnit1(TestCaseWithTransport):
353
 
 
354
 
    def test_attribute__fetch_order(self):
355
 
        """Knits need topological data insertion."""
356
 
        repo = self.make_repository('.',
357
 
                format=bzrdir.format_registry.get('knit')())
358
 
        self.assertEqual('topological', repo._format._fetch_order)
359
 
 
360
 
    def test_attribute__fetch_uses_deltas(self):
361
 
        """Knits reuse deltas."""
362
 
        repo = self.make_repository('.',
363
 
                format=bzrdir.format_registry.get('knit')())
364
 
        self.assertEqual(True, repo._format._fetch_uses_deltas)
365
 
 
 
293
    
366
294
    def test_disk_layout(self):
367
295
        control = bzrdir.BzrDirMetaFormat1().initialize(self.get_url())
368
296
        repo = knitrepo.RepositoryFormatKnit1().initialize(control)
382
310
        # self.assertEqualDiff('', t.get('lock').read())
383
311
        self.assertTrue(S_ISDIR(t.stat('knits').st_mode))
384
312
        self.check_knits(t)
385
 
        # Check per-file knits.
386
 
        branch = control.create_branch()
387
 
        tree = control.create_workingtree()
388
 
        tree.add(['foo'], ['Nasty-IdC:'], ['file'])
389
 
        tree.put_file_bytes_non_atomic('Nasty-IdC:', '')
390
 
        tree.commit('1st post', rev_id='foo')
391
 
        self.assertHasKnit(t, 'knits/e8/%254easty-%2549d%2543%253a',
392
 
            '\nfoo fulltext 0 81  :')
393
313
 
394
 
    def assertHasKnit(self, t, knit_name, extra_content=''):
 
314
    def assertHasKnit(self, t, knit_name):
395
315
        """Assert that knit_name exists on t."""
396
 
        self.assertEqualDiff('# bzr knit index 8\n' + extra_content,
 
316
        self.assertEqualDiff('# bzr knit index 8\n',
397
317
                             t.get(knit_name + '.kndx').read())
 
318
        # no default content
 
319
        self.assertTrue(t.has(knit_name + '.knit'))
398
320
 
399
321
    def check_knits(self, t):
400
322
        """check knit content for a repository."""
444
366
        self.assertTrue(S_ISDIR(t.stat('knits').st_mode))
445
367
        self.check_knits(t)
446
368
 
 
369
    def test_exposed_versioned_files_are_marked_dirty(self):
 
370
        format = bzrdir.BzrDirMetaFormat1()
 
371
        format.repository_format = knitrepo.RepositoryFormatKnit1()
 
372
        repo = self.make_repository('.', format=format)
 
373
        repo.lock_write()
 
374
        inv = repo.get_inventory_weave()
 
375
        repo.unlock()
 
376
        self.assertRaises(errors.OutSideTransaction,
 
377
            inv.add_lines, 'foo', [], [])
 
378
 
447
379
    def test_deserialise_sets_root_revision(self):
448
380
        """We must have a inventory.root.revision
449
381
 
454
386
        repo = self.make_repository('.',
455
387
                format=bzrdir.format_registry.get('knit')())
456
388
        inv_xml = '<inventory format="5">\n</inventory>\n'
457
 
        inv = repo._deserialise_inventory('test-rev-id', inv_xml)
 
389
        inv = repo.deserialise_inventory('test-rev-id', inv_xml)
458
390
        self.assertEqual('test-rev-id', inv.root.revision)
459
391
 
460
392
    def test_deserialise_uses_global_revision_id(self):
466
398
        # Arguably, the deserialise_inventory should detect a mismatch, and
467
399
        # raise an error, rather than silently using one revision_id over the
468
400
        # other.
469
 
        self.assertRaises(AssertionError, repo._deserialise_inventory,
 
401
        self.assertRaises(AssertionError, repo.deserialise_inventory,
470
402
            'test-rev-id', inv_xml)
471
 
        inv = repo._deserialise_inventory('other-rev-id', inv_xml)
 
403
        inv = repo.deserialise_inventory('other-rev-id', inv_xml)
472
404
        self.assertEqual('other-rev-id', inv.root.revision)
473
405
 
474
 
    def test_supports_external_lookups(self):
475
 
        repo = self.make_repository('.',
476
 
                format=bzrdir.format_registry.get('knit')())
477
 
        self.assertFalse(repo._format.supports_external_lookups)
 
406
 
 
407
class KnitRepositoryStreamTests(test_knit.KnitTests):
 
408
    """Tests for knitrepo._get_stream_as_bytes."""
 
409
 
 
410
    def test_get_stream_as_bytes(self):
 
411
        # Make a simple knit
 
412
        k1 = self.make_test_knit()
 
413
        k1.add_lines('text-a', [], test_knit.split_lines(test_knit.TEXT_1))
 
414
        
 
415
        # Serialise it, check the output.
 
416
        bytes = knitrepo._get_stream_as_bytes(k1, ['text-a'])
 
417
        data = bencode.bdecode(bytes)
 
418
        format, record = data
 
419
        self.assertEqual('knit-plain', format)
 
420
        self.assertEqual(['text-a', ['fulltext'], []], record[:3])
 
421
        self.assertRecordContentEqual(k1, 'text-a', record[3])
 
422
 
 
423
    def test_get_stream_as_bytes_all(self):
 
424
        """Get a serialised data stream for all the records in a knit.
 
425
 
 
426
        Much like test_get_stream_all, except for get_stream_as_bytes.
 
427
        """
 
428
        k1 = self.make_test_knit()
 
429
        # Insert the same data as BasicKnitTests.test_knit_join, as they seem
 
430
        # to cover a range of cases (no parents, one parent, multiple parents).
 
431
        test_data = [
 
432
            ('text-a', [], test_knit.TEXT_1),
 
433
            ('text-b', ['text-a'], test_knit.TEXT_1),
 
434
            ('text-c', [], test_knit.TEXT_1),
 
435
            ('text-d', ['text-c'], test_knit.TEXT_1),
 
436
            ('text-m', ['text-b', 'text-d'], test_knit.TEXT_1),
 
437
           ]
 
438
        # This test is actually a bit strict as the order in which they're
 
439
        # returned is not defined.  This matches the current (deterministic)
 
440
        # behaviour.
 
441
        expected_data_list = [
 
442
            # version, options, parents
 
443
            ('text-a', ['fulltext'], []),
 
444
            ('text-b', ['line-delta'], ['text-a']),
 
445
            ('text-m', ['line-delta'], ['text-b', 'text-d']),
 
446
            ('text-c', ['fulltext'], []),
 
447
            ('text-d', ['line-delta'], ['text-c']),
 
448
            ]
 
449
        for version_id, parents, lines in test_data:
 
450
            k1.add_lines(version_id, parents, test_knit.split_lines(lines))
 
451
 
 
452
        bytes = knitrepo._get_stream_as_bytes(
 
453
            k1, ['text-a', 'text-b', 'text-m', 'text-c', 'text-d', ])
 
454
 
 
455
        data = bencode.bdecode(bytes)
 
456
        format = data.pop(0)
 
457
        self.assertEqual('knit-plain', format)
 
458
 
 
459
        for expected, actual in zip(expected_data_list, data):
 
460
            expected_version = expected[0]
 
461
            expected_options = expected[1]
 
462
            expected_parents = expected[2]
 
463
            version, options, parents, bytes = actual
 
464
            self.assertEqual(expected_version, version)
 
465
            self.assertEqual(expected_options, options)
 
466
            self.assertEqual(expected_parents, parents)
 
467
            self.assertRecordContentEqual(k1, version, bytes)
478
468
 
479
469
 
480
470
class DummyRepository(object):
481
471
    """A dummy repository for testing."""
482
472
 
483
 
    _format = None
484
473
    _serializer = None
485
474
 
486
475
    def supports_rich_root(self):
487
 
        if self._format is not None:
488
 
            return self._format.rich_root_data
489
476
        return False
490
477
 
491
 
    def get_graph(self):
492
 
        raise NotImplementedError
493
 
 
494
 
    def get_parent_map(self, revision_ids):
495
 
        raise NotImplementedError
496
 
 
497
478
 
498
479
class InterDummy(repository.InterRepository):
499
480
    """An inter-repository optimised code path for DummyRepository.
506
487
    @staticmethod
507
488
    def is_compatible(repo_source, repo_target):
508
489
        """InterDummy is compatible with DummyRepository."""
509
 
        return (isinstance(repo_source, DummyRepository) and
 
490
        return (isinstance(repo_source, DummyRepository) and 
510
491
            isinstance(repo_target, DummyRepository))
511
492
 
512
493
 
525
506
 
526
507
    def assertGetsDefaultInterRepository(self, repo_a, repo_b):
527
508
        """Asserts that InterRepository.get(repo_a, repo_b) -> the default.
528
 
 
 
509
        
529
510
        The effective default is now InterSameDataRepository because there is
530
511
        no actual sane default in the presence of incompatible data models.
531
512
        """
542
523
        # pair that it returns true on for the is_compatible static method
543
524
        # check
544
525
        dummy_a = DummyRepository()
545
 
        dummy_a._format = RepositoryFormat()
546
526
        dummy_b = DummyRepository()
547
 
        dummy_b._format = RepositoryFormat()
548
527
        repo = self.make_repository('.')
549
528
        # hack dummies to look like repo somewhat.
550
529
        dummy_a._serializer = repo._serializer
551
 
        dummy_a._format.supports_tree_reference = repo._format.supports_tree_reference
552
 
        dummy_a._format.rich_root_data = repo._format.rich_root_data
553
530
        dummy_b._serializer = repo._serializer
554
 
        dummy_b._format.supports_tree_reference = repo._format.supports_tree_reference
555
 
        dummy_b._format.rich_root_data = repo._format.rich_root_data
556
531
        repository.InterRepository.register_optimiser(InterDummy)
557
532
        try:
558
533
            # we should get the default for something InterDummy returns False
602
577
                                                        repo_b).__class__)
603
578
 
604
579
 
 
580
class TestInterRemoteToOther(TestCaseWithTransport):
 
581
 
 
582
    def make_remote_repository(self, path, backing_format=None):
 
583
        """Make a RemoteRepository object backed by a real repository that will
 
584
        be created at the given path."""
 
585
        self.make_repository(path, format=backing_format)
 
586
        smart_server = server.SmartTCPServer_for_testing()
 
587
        smart_server.setUp()
 
588
        remote_transport = get_transport(smart_server.get_url()).clone(path)
 
589
        self.addCleanup(smart_server.tearDown)
 
590
        remote_bzrdir = bzrdir.BzrDir.open_from_transport(remote_transport)
 
591
        remote_repo = remote_bzrdir.open_repository()
 
592
        return remote_repo
 
593
 
 
594
    def test_is_compatible_same_format(self):
 
595
        """InterRemoteToOther is compatible with a remote repository and a
 
596
        second repository that have the same format."""
 
597
        local_repo = self.make_repository('local')
 
598
        remote_repo = self.make_remote_repository('remote')
 
599
        is_compatible = repository.InterRemoteToOther.is_compatible
 
600
        self.assertTrue(
 
601
            is_compatible(remote_repo, local_repo),
 
602
            "InterRemoteToOther(%r, %r) is false" % (remote_repo, local_repo))
 
603
          
 
604
    def test_is_incompatible_different_format(self):
 
605
        local_repo = self.make_repository('local', 'dirstate')
 
606
        remote_repo = self.make_remote_repository('a', 'dirstate-with-subtree')
 
607
        is_compatible = repository.InterRemoteToOther.is_compatible
 
608
        self.assertFalse(
 
609
            is_compatible(remote_repo, local_repo),
 
610
            "InterRemoteToOther(%r, %r) is true" % (local_repo, remote_repo))
 
611
 
 
612
    def test_is_incompatible_different_format_both_remote(self):
 
613
        remote_repo_a = self.make_remote_repository(
 
614
            'a', 'dirstate-with-subtree')
 
615
        remote_repo_b = self.make_remote_repository('b', 'dirstate')
 
616
        is_compatible = repository.InterRemoteToOther.is_compatible
 
617
        self.assertFalse(
 
618
            is_compatible(remote_repo_a, remote_repo_b),
 
619
            "InterRemoteToOther(%r, %r) is true"
 
620
            % (remote_repo_a, remote_repo_b))
 
621
 
 
622
 
605
623
class TestRepositoryConverter(TestCaseWithTransport):
606
624
 
607
625
    def test_convert_empty(self):
621
639
 
622
640
 
623
641
class TestMisc(TestCase):
624
 
 
 
642
    
625
643
    def test_unescape_xml(self):
626
644
        """We get some kind of error when malformed entities are passed"""
627
 
        self.assertRaises(KeyError, repository._unescape_xml, 'foo&bar;')
 
645
        self.assertRaises(KeyError, repository._unescape_xml, 'foo&bar;') 
628
646
 
629
647
 
630
648
class TestRepositoryFormatKnit3(TestCaseWithTransport):
631
649
 
632
 
    def test_attribute__fetch_order(self):
633
 
        """Knits need topological data insertion."""
634
 
        format = bzrdir.BzrDirMetaFormat1()
635
 
        format.repository_format = knitrepo.RepositoryFormatKnit3()
636
 
        repo = self.make_repository('.', format=format)
637
 
        self.assertEqual('topological', repo._format._fetch_order)
638
 
 
639
 
    def test_attribute__fetch_uses_deltas(self):
640
 
        """Knits reuse deltas."""
641
 
        format = bzrdir.BzrDirMetaFormat1()
642
 
        format.repository_format = knitrepo.RepositoryFormatKnit3()
643
 
        repo = self.make_repository('.', format=format)
644
 
        self.assertEqual(True, repo._format._fetch_uses_deltas)
645
 
 
646
650
    def test_convert(self):
647
651
        """Ensure the upgrade adds weaves for roots"""
648
652
        format = bzrdir.BzrDirMetaFormat1()
650
654
        tree = self.make_branch_and_tree('.', format)
651
655
        tree.commit("Dull commit", rev_id="dull")
652
656
        revision_tree = tree.branch.repository.revision_tree('dull')
653
 
        revision_tree.lock_read()
654
 
        try:
655
 
            self.assertRaises(errors.NoSuchFile, revision_tree.get_file_lines,
656
 
                revision_tree.inventory.root.file_id)
657
 
        finally:
658
 
            revision_tree.unlock()
 
657
        self.assertRaises(errors.NoSuchFile, revision_tree.get_file_lines,
 
658
            revision_tree.inventory.root.file_id)
659
659
        format = bzrdir.BzrDirMetaFormat1()
660
660
        format.repository_format = knitrepo.RepositoryFormatKnit3()
661
661
        upgrade.Convert('.', format)
662
662
        tree = workingtree.WorkingTree.open('.')
663
663
        revision_tree = tree.branch.repository.revision_tree('dull')
664
 
        revision_tree.lock_read()
665
 
        try:
666
 
            revision_tree.get_file_lines(revision_tree.inventory.root.file_id)
667
 
        finally:
668
 
            revision_tree.unlock()
 
664
        revision_tree.get_file_lines(revision_tree.inventory.root.file_id)
669
665
        tree.commit("Another dull commit", rev_id='dull2')
670
666
        revision_tree = tree.branch.repository.revision_tree('dull2')
671
 
        revision_tree.lock_read()
672
 
        self.addCleanup(revision_tree.unlock)
673
667
        self.assertEqual('dull', revision_tree.inventory.root.revision)
674
668
 
675
 
    def test_supports_external_lookups(self):
 
669
    def test_exposed_versioned_files_are_marked_dirty(self):
676
670
        format = bzrdir.BzrDirMetaFormat1()
677
671
        format.repository_format = knitrepo.RepositoryFormatKnit3()
678
672
        repo = self.make_repository('.', format=format)
679
 
        self.assertFalse(repo._format.supports_external_lookups)
680
 
 
681
 
 
682
 
class Test2a(tests.TestCaseWithMemoryTransport):
683
 
 
684
 
    def test_fetch_combines_groups(self):
685
 
        builder = self.make_branch_builder('source', format='2a')
686
 
        builder.start_series()
687
 
        builder.build_snapshot('1', None, [
688
 
            ('add', ('', 'root-id', 'directory', '')),
689
 
            ('add', ('file', 'file-id', 'file', 'content\n'))])
690
 
        builder.build_snapshot('2', ['1'], [
691
 
            ('modify', ('file-id', 'content-2\n'))])
692
 
        builder.finish_series()
693
 
        source = builder.get_branch()
694
 
        target = self.make_repository('target', format='2a')
695
 
        target.fetch(source.repository)
696
 
        target.lock_read()
697
 
        self.addCleanup(target.unlock)
698
 
        details = target.texts._index.get_build_details(
699
 
            [('file-id', '1',), ('file-id', '2',)])
700
 
        file_1_details = details[('file-id', '1')]
701
 
        file_2_details = details[('file-id', '2')]
702
 
        # The index, and what to read off disk, should be the same for both
703
 
        # versions of the file.
704
 
        self.assertEqual(file_1_details[0][:3], file_2_details[0][:3])
705
 
 
706
 
    def test_fetch_combines_groups(self):
707
 
        builder = self.make_branch_builder('source', format='2a')
708
 
        builder.start_series()
709
 
        builder.build_snapshot('1', None, [
710
 
            ('add', ('', 'root-id', 'directory', '')),
711
 
            ('add', ('file', 'file-id', 'file', 'content\n'))])
712
 
        builder.build_snapshot('2', ['1'], [
713
 
            ('modify', ('file-id', 'content-2\n'))])
714
 
        builder.finish_series()
715
 
        source = builder.get_branch()
716
 
        target = self.make_repository('target', format='2a')
717
 
        target.fetch(source.repository)
718
 
        target.lock_read()
719
 
        self.addCleanup(target.unlock)
720
 
        details = target.texts._index.get_build_details(
721
 
            [('file-id', '1',), ('file-id', '2',)])
722
 
        file_1_details = details[('file-id', '1')]
723
 
        file_2_details = details[('file-id', '2')]
724
 
        # The index, and what to read off disk, should be the same for both
725
 
        # versions of the file.
726
 
        self.assertEqual(file_1_details[0][:3], file_2_details[0][:3])
727
 
 
728
 
    def test_fetch_combines_groups(self):
729
 
        builder = self.make_branch_builder('source', format='2a')
730
 
        builder.start_series()
731
 
        builder.build_snapshot('1', None, [
732
 
            ('add', ('', 'root-id', 'directory', '')),
733
 
            ('add', ('file', 'file-id', 'file', 'content\n'))])
734
 
        builder.build_snapshot('2', ['1'], [
735
 
            ('modify', ('file-id', 'content-2\n'))])
736
 
        builder.finish_series()
737
 
        source = builder.get_branch()
738
 
        target = self.make_repository('target', format='2a')
739
 
        target.fetch(source.repository)
740
 
        target.lock_read()
741
 
        self.addCleanup(target.unlock)
742
 
        details = target.texts._index.get_build_details(
743
 
            [('file-id', '1',), ('file-id', '2',)])
744
 
        file_1_details = details[('file-id', '1')]
745
 
        file_2_details = details[('file-id', '2')]
746
 
        # The index, and what to read off disk, should be the same for both
747
 
        # versions of the file.
748
 
        self.assertEqual(file_1_details[0][:3], file_2_details[0][:3])
749
 
 
750
 
    def test_format_pack_compresses_True(self):
751
 
        repo = self.make_repository('repo', format='2a')
752
 
        self.assertTrue(repo._format.pack_compresses)
753
 
 
754
 
    def test_inventories_use_chk_map_with_parent_base_dict(self):
755
 
        tree = self.make_branch_and_memory_tree('repo', format="2a")
756
 
        tree.lock_write()
757
 
        tree.add([''], ['TREE_ROOT'])
758
 
        revid = tree.commit("foo")
759
 
        tree.unlock()
760
 
        tree.lock_read()
761
 
        self.addCleanup(tree.unlock)
762
 
        inv = tree.branch.repository.get_inventory(revid)
763
 
        self.assertNotEqual(None, inv.parent_id_basename_to_file_id)
764
 
        inv.parent_id_basename_to_file_id._ensure_root()
765
 
        inv.id_to_entry._ensure_root()
766
 
        self.assertEqual(65536, inv.id_to_entry._root_node.maximum_size)
767
 
        self.assertEqual(65536,
768
 
            inv.parent_id_basename_to_file_id._root_node.maximum_size)
769
 
 
770
 
    def test_autopack_unchanged_chk_nodes(self):
771
 
        # at 20 unchanged commits, chk pages are packed that are split into
772
 
        # two groups such that the new pack being made doesn't have all its
773
 
        # pages in the source packs (though they are in the repository).
774
 
        # Use a memory backed repository, we don't need to hit disk for this
775
 
        tree = self.make_branch_and_memory_tree('tree', format='2a')
776
 
        tree.lock_write()
777
 
        self.addCleanup(tree.unlock)
778
 
        tree.add([''], ['TREE_ROOT'])
779
 
        for pos in range(20):
780
 
            tree.commit(str(pos))
781
 
 
782
 
    def test_pack_with_hint(self):
783
 
        tree = self.make_branch_and_memory_tree('tree', format='2a')
784
 
        tree.lock_write()
785
 
        self.addCleanup(tree.unlock)
786
 
        tree.add([''], ['TREE_ROOT'])
787
 
        # 1 commit to leave untouched
788
 
        tree.commit('1')
789
 
        to_keep = tree.branch.repository._pack_collection.names()
790
 
        # 2 to combine
791
 
        tree.commit('2')
792
 
        tree.commit('3')
793
 
        all = tree.branch.repository._pack_collection.names()
794
 
        combine = list(set(all) - set(to_keep))
795
 
        self.assertLength(3, all)
796
 
        self.assertLength(2, combine)
797
 
        tree.branch.repository.pack(hint=combine)
798
 
        final = tree.branch.repository._pack_collection.names()
799
 
        self.assertLength(2, final)
800
 
        self.assertFalse(combine[0] in final)
801
 
        self.assertFalse(combine[1] in final)
802
 
        self.assertSubset(to_keep, final)
803
 
 
804
 
    def test_stream_source_to_gc(self):
805
 
        source = self.make_repository('source', format='2a')
806
 
        target = self.make_repository('target', format='2a')
807
 
        stream = source._get_source(target._format)
808
 
        self.assertIsInstance(stream, groupcompress_repo.GroupCHKStreamSource)
809
 
 
810
 
    def test_stream_source_to_non_gc(self):
811
 
        source = self.make_repository('source', format='2a')
812
 
        target = self.make_repository('target', format='rich-root-pack')
813
 
        stream = source._get_source(target._format)
814
 
        # We don't want the child GroupCHKStreamSource
815
 
        self.assertIs(type(stream), repository.StreamSource)
816
 
 
817
 
    def test_get_stream_for_missing_keys_includes_all_chk_refs(self):
818
 
        source_builder = self.make_branch_builder('source',
819
 
                            format='2a')
820
 
        # We have to build a fairly large tree, so that we are sure the chk
821
 
        # pages will have split into multiple pages.
822
 
        entries = [('add', ('', 'a-root-id', 'directory', None))]
823
 
        for i in 'abcdefghijklmnopqrstuvwxyz123456789':
824
 
            for j in 'abcdefghijklmnopqrstuvwxyz123456789':
825
 
                fname = i + j
826
 
                fid = fname + '-id'
827
 
                content = 'content for %s\n' % (fname,)
828
 
                entries.append(('add', (fname, fid, 'file', content)))
829
 
        source_builder.start_series()
830
 
        source_builder.build_snapshot('rev-1', None, entries)
831
 
        # Now change a few of them, so we get a few new pages for the second
832
 
        # revision
833
 
        source_builder.build_snapshot('rev-2', ['rev-1'], [
834
 
            ('modify', ('aa-id', 'new content for aa-id\n')),
835
 
            ('modify', ('cc-id', 'new content for cc-id\n')),
836
 
            ('modify', ('zz-id', 'new content for zz-id\n')),
837
 
            ])
838
 
        source_builder.finish_series()
839
 
        source_branch = source_builder.get_branch()
840
 
        source_branch.lock_read()
841
 
        self.addCleanup(source_branch.unlock)
842
 
        target = self.make_repository('target', format='2a')
843
 
        source = source_branch.repository._get_source(target._format)
844
 
        self.assertIsInstance(source, groupcompress_repo.GroupCHKStreamSource)
845
 
 
846
 
        # On a regular pass, getting the inventories and chk pages for rev-2
847
 
        # would only get the newly created chk pages
848
 
        search = graph.SearchResult(set(['rev-2']), set(['rev-1']), 1,
849
 
                                    set(['rev-2']))
850
 
        simple_chk_records = []
851
 
        for vf_name, substream in source.get_stream(search):
852
 
            if vf_name == 'chk_bytes':
853
 
                for record in substream:
854
 
                    simple_chk_records.append(record.key)
855
 
            else:
856
 
                for _ in substream:
857
 
                    continue
858
 
        # 3 pages, the root (InternalNode), + 2 pages which actually changed
859
 
        self.assertEqual([('sha1:91481f539e802c76542ea5e4c83ad416bf219f73',),
860
 
                          ('sha1:4ff91971043668583985aec83f4f0ab10a907d3f',),
861
 
                          ('sha1:81e7324507c5ca132eedaf2d8414ee4bb2226187',),
862
 
                          ('sha1:b101b7da280596c71a4540e9a1eeba8045985ee0',)],
863
 
                         simple_chk_records)
864
 
        # Now, when we do a similar call using 'get_stream_for_missing_keys'
865
 
        # we should get a much larger set of pages.
866
 
        missing = [('inventories', 'rev-2')]
867
 
        full_chk_records = []
868
 
        for vf_name, substream in source.get_stream_for_missing_keys(missing):
869
 
            if vf_name == 'inventories':
870
 
                for record in substream:
871
 
                    self.assertEqual(('rev-2',), record.key)
872
 
            elif vf_name == 'chk_bytes':
873
 
                for record in substream:
874
 
                    full_chk_records.append(record.key)
875
 
            else:
876
 
                self.fail('Should not be getting a stream of %s' % (vf_name,))
877
 
        # We have 257 records now. This is because we have 1 root page, and 256
878
 
        # leaf pages in a complete listing.
879
 
        self.assertEqual(257, len(full_chk_records))
880
 
        self.assertSubset(simple_chk_records, full_chk_records)
881
 
 
882
 
    def test_inconsistency_fatal(self):
883
 
        repo = self.make_repository('repo', format='2a')
884
 
        self.assertTrue(repo.revisions._index._inconsistency_fatal)
885
 
        self.assertFalse(repo.texts._index._inconsistency_fatal)
886
 
        self.assertFalse(repo.inventories._index._inconsistency_fatal)
887
 
        self.assertFalse(repo.signatures._index._inconsistency_fatal)
888
 
        self.assertFalse(repo.chk_bytes._index._inconsistency_fatal)
889
 
 
890
 
 
891
 
class TestKnitPackStreamSource(tests.TestCaseWithMemoryTransport):
892
 
 
893
 
    def test_source_to_exact_pack_092(self):
894
 
        source = self.make_repository('source', format='pack-0.92')
895
 
        target = self.make_repository('target', format='pack-0.92')
896
 
        stream_source = source._get_source(target._format)
897
 
        self.assertIsInstance(stream_source, pack_repo.KnitPackStreamSource)
898
 
 
899
 
    def test_source_to_exact_pack_rich_root_pack(self):
900
 
        source = self.make_repository('source', format='rich-root-pack')
901
 
        target = self.make_repository('target', format='rich-root-pack')
902
 
        stream_source = source._get_source(target._format)
903
 
        self.assertIsInstance(stream_source, pack_repo.KnitPackStreamSource)
904
 
 
905
 
    def test_source_to_exact_pack_19(self):
906
 
        source = self.make_repository('source', format='1.9')
907
 
        target = self.make_repository('target', format='1.9')
908
 
        stream_source = source._get_source(target._format)
909
 
        self.assertIsInstance(stream_source, pack_repo.KnitPackStreamSource)
910
 
 
911
 
    def test_source_to_exact_pack_19_rich_root(self):
912
 
        source = self.make_repository('source', format='1.9-rich-root')
913
 
        target = self.make_repository('target', format='1.9-rich-root')
914
 
        stream_source = source._get_source(target._format)
915
 
        self.assertIsInstance(stream_source, pack_repo.KnitPackStreamSource)
916
 
 
917
 
    def test_source_to_remote_exact_pack_19(self):
918
 
        trans = self.make_smart_server('target')
919
 
        trans.ensure_base()
920
 
        source = self.make_repository('source', format='1.9')
921
 
        target = self.make_repository('target', format='1.9')
922
 
        target = repository.Repository.open(trans.base)
923
 
        stream_source = source._get_source(target._format)
924
 
        self.assertIsInstance(stream_source, pack_repo.KnitPackStreamSource)
925
 
 
926
 
    def test_stream_source_to_non_exact(self):
927
 
        source = self.make_repository('source', format='pack-0.92')
928
 
        target = self.make_repository('target', format='1.9')
929
 
        stream = source._get_source(target._format)
930
 
        self.assertIs(type(stream), repository.StreamSource)
931
 
 
932
 
    def test_stream_source_to_non_exact_rich_root(self):
933
 
        source = self.make_repository('source', format='1.9')
934
 
        target = self.make_repository('target', format='1.9-rich-root')
935
 
        stream = source._get_source(target._format)
936
 
        self.assertIs(type(stream), repository.StreamSource)
937
 
 
938
 
    def test_source_to_remote_non_exact_pack_19(self):
939
 
        trans = self.make_smart_server('target')
940
 
        trans.ensure_base()
941
 
        source = self.make_repository('source', format='1.9')
942
 
        target = self.make_repository('target', format='1.6')
943
 
        target = repository.Repository.open(trans.base)
944
 
        stream_source = source._get_source(target._format)
945
 
        self.assertIs(type(stream_source), repository.StreamSource)
946
 
 
947
 
    def test_stream_source_to_knit(self):
948
 
        source = self.make_repository('source', format='pack-0.92')
949
 
        target = self.make_repository('target', format='dirstate')
950
 
        stream = source._get_source(target._format)
951
 
        self.assertIs(type(stream), repository.StreamSource)
952
 
 
953
 
 
954
 
class TestDevelopment6FindParentIdsOfRevisions(TestCaseWithTransport):
955
 
    """Tests for _find_parent_ids_of_revisions."""
956
 
 
957
 
    def setUp(self):
958
 
        super(TestDevelopment6FindParentIdsOfRevisions, self).setUp()
959
 
        self.builder = self.make_branch_builder('source',
960
 
            format='development6-rich-root')
961
 
        self.builder.start_series()
962
 
        self.builder.build_snapshot('initial', None,
963
 
            [('add', ('', 'tree-root', 'directory', None))])
964
 
        self.repo = self.builder.get_branch().repository
965
 
        self.addCleanup(self.builder.finish_series)
966
 
 
967
 
    def assertParentIds(self, expected_result, rev_set):
968
 
        self.assertEqual(sorted(expected_result),
969
 
            sorted(self.repo._find_parent_ids_of_revisions(rev_set)))
970
 
 
971
 
    def test_simple(self):
972
 
        self.builder.build_snapshot('revid1', None, [])
973
 
        self.builder.build_snapshot('revid2', ['revid1'], [])
974
 
        rev_set = ['revid2']
975
 
        self.assertParentIds(['revid1'], rev_set)
976
 
 
977
 
    def test_not_first_parent(self):
978
 
        self.builder.build_snapshot('revid1', None, [])
979
 
        self.builder.build_snapshot('revid2', ['revid1'], [])
980
 
        self.builder.build_snapshot('revid3', ['revid2'], [])
981
 
        rev_set = ['revid3', 'revid2']
982
 
        self.assertParentIds(['revid1'], rev_set)
983
 
 
984
 
    def test_not_null(self):
985
 
        rev_set = ['initial']
986
 
        self.assertParentIds([], rev_set)
987
 
 
988
 
    def test_not_null_set(self):
989
 
        self.builder.build_snapshot('revid1', None, [])
990
 
        rev_set = [_mod_revision.NULL_REVISION]
991
 
        self.assertParentIds([], rev_set)
992
 
 
993
 
    def test_ghost(self):
994
 
        self.builder.build_snapshot('revid1', None, [])
995
 
        rev_set = ['ghost', 'revid1']
996
 
        self.assertParentIds(['initial'], rev_set)
997
 
 
998
 
    def test_ghost_parent(self):
999
 
        self.builder.build_snapshot('revid1', None, [])
1000
 
        self.builder.build_snapshot('revid2', ['revid1', 'ghost'], [])
1001
 
        rev_set = ['revid2', 'revid1']
1002
 
        self.assertParentIds(['ghost', 'initial'], rev_set)
1003
 
 
1004
 
    def test_righthand_parent(self):
1005
 
        self.builder.build_snapshot('revid1', None, [])
1006
 
        self.builder.build_snapshot('revid2a', ['revid1'], [])
1007
 
        self.builder.build_snapshot('revid2b', ['revid1'], [])
1008
 
        self.builder.build_snapshot('revid3', ['revid2a', 'revid2b'], [])
1009
 
        rev_set = ['revid3', 'revid2a']
1010
 
        self.assertParentIds(['revid1', 'revid2b'], rev_set)
 
673
        repo.lock_write()
 
674
        inv = repo.get_inventory_weave()
 
675
        repo.unlock()
 
676
        self.assertRaises(errors.OutSideTransaction,
 
677
            inv.add_lines, 'foo', [], [])
1011
678
 
1012
679
 
1013
680
class TestWithBrokenRepo(TestCaseWithTransport):
1028
695
            inv = inventory.Inventory(revision_id='rev1a')
1029
696
            inv.root.revision = 'rev1a'
1030
697
            self.add_file(repo, inv, 'file1', 'rev1a', [])
1031
 
            repo.texts.add_lines((inv.root.file_id, 'rev1a'), [], [])
1032
698
            repo.add_inventory('rev1a', inv, [])
1033
699
            revision = _mod_revision.Revision('rev1a',
1034
700
                committer='jrandom@example.com', timestamp=0,
1069
735
    def add_revision(self, repo, revision_id, inv, parent_ids):
1070
736
        inv.revision_id = revision_id
1071
737
        inv.root.revision = revision_id
1072
 
        repo.texts.add_lines((inv.root.file_id, revision_id), [], [])
1073
738
        repo.add_inventory(revision_id, inv, parent_ids)
1074
739
        revision = _mod_revision.Revision(revision_id,
1075
740
            committer='jrandom@example.com', timestamp=0, inventory_sha1='',
1082
747
        entry.revision = revision
1083
748
        entry.text_size = 0
1084
749
        inv.add(entry)
1085
 
        text_key = (file_id, revision)
1086
 
        parent_keys = [(file_id, parent) for parent in parents]
1087
 
        repo.texts.add_lines(text_key, parent_keys, ['line\n'])
 
750
        vf = repo.weave_store.get_weave_or_empty(file_id,
 
751
                                                 repo.get_transaction())
 
752
        vf.add_lines(revision, parents, ['line\n'])
1088
753
 
1089
754
    def test_insert_from_broken_repo(self):
1090
755
        """Inserting a data stream from a broken repository won't silently
1092
757
        """
1093
758
        broken_repo = self.make_broken_repository()
1094
759
        empty_repo = self.make_repository('empty-repo')
1095
 
        try:
1096
 
            empty_repo.fetch(broken_repo)
1097
 
        except (errors.RevisionNotPresent, errors.BzrCheckError):
1098
 
            # Test successful: compression parent not being copied leads to
1099
 
            # error.
1100
 
            return
1101
 
        empty_repo.lock_read()
 
760
        stream = broken_repo.get_data_stream(['rev1a', 'rev2', 'rev3'])
 
761
        empty_repo.lock_write()
1102
762
        self.addCleanup(empty_repo.unlock)
1103
 
        text = empty_repo.texts.get_record_stream(
1104
 
            [('file2-id', 'rev3')], 'topological', True).next()
1105
 
        self.assertEqual('line\n', text.get_bytes_as('fulltext'))
 
763
        empty_repo.start_write_group()
 
764
        try:
 
765
            self.assertRaises(
 
766
                errors.KnitCorrupt, empty_repo.insert_data_stream, stream)
 
767
        finally:
 
768
            empty_repo.abort_write_group()
 
769
 
 
770
 
 
771
class TestKnitPackNoSubtrees(TestCaseWithTransport):
 
772
 
 
773
    def get_format(self):
 
774
        return bzrdir.format_registry.make_bzrdir('pack-0.92')
 
775
 
 
776
    def test_disk_layout(self):
 
777
        format = self.get_format()
 
778
        repo = self.make_repository('.', format=format)
 
779
        # in case of side effects of locking.
 
780
        repo.lock_write()
 
781
        repo.unlock()
 
782
        t = repo.bzrdir.get_repository_transport(None)
 
783
        self.check_format(t)
 
784
        # XXX: no locks left when unlocked at the moment
 
785
        # self.assertEqualDiff('', t.get('lock').read())
 
786
        self.check_databases(t)
 
787
 
 
788
    def check_format(self, t):
 
789
        self.assertEqualDiff(
 
790
            "Bazaar pack repository format 1 (needs bzr 0.92)\n",
 
791
                             t.get('format').read())
 
792
 
 
793
    def assertHasKndx(self, t, knit_name):
 
794
        """Assert that knit_name exists on t."""
 
795
        self.assertEqualDiff('# bzr knit index 8\n',
 
796
                             t.get(knit_name + '.kndx').read())
 
797
 
 
798
    def assertHasNoKndx(self, t, knit_name):
 
799
        """Assert that knit_name has no index on t."""
 
800
        self.assertFalse(t.has(knit_name + '.kndx'))
 
801
 
 
802
    def assertHasNoKnit(self, t, knit_name):
 
803
        """Assert that knit_name exists on t."""
 
804
        # no default content
 
805
        self.assertFalse(t.has(knit_name + '.knit'))
 
806
 
 
807
    def check_databases(self, t):
 
808
        """check knit content for a repository."""
 
809
        # check conversion worked
 
810
        self.assertHasNoKndx(t, 'inventory')
 
811
        self.assertHasNoKnit(t, 'inventory')
 
812
        self.assertHasNoKndx(t, 'revisions')
 
813
        self.assertHasNoKnit(t, 'revisions')
 
814
        self.assertHasNoKndx(t, 'signatures')
 
815
        self.assertHasNoKnit(t, 'signatures')
 
816
        self.assertFalse(t.has('knits'))
 
817
        # revision-indexes file-container directory
 
818
        self.assertEqual([],
 
819
            list(GraphIndex(t, 'pack-names', None).iter_all_entries()))
 
820
        self.assertTrue(S_ISDIR(t.stat('packs').st_mode))
 
821
        self.assertTrue(S_ISDIR(t.stat('upload').st_mode))
 
822
        self.assertTrue(S_ISDIR(t.stat('indices').st_mode))
 
823
        self.assertTrue(S_ISDIR(t.stat('obsolete_packs').st_mode))
 
824
 
 
825
    def test_shared_disk_layout(self):
 
826
        format = self.get_format()
 
827
        repo = self.make_repository('.', shared=True, format=format)
 
828
        # we want:
 
829
        t = repo.bzrdir.get_repository_transport(None)
 
830
        self.check_format(t)
 
831
        # XXX: no locks left when unlocked at the moment
 
832
        # self.assertEqualDiff('', t.get('lock').read())
 
833
        # We should have a 'shared-storage' marker file.
 
834
        self.assertEqualDiff('', t.get('shared-storage').read())
 
835
        self.check_databases(t)
 
836
 
 
837
    def test_shared_no_tree_disk_layout(self):
 
838
        format = self.get_format()
 
839
        repo = self.make_repository('.', shared=True, format=format)
 
840
        repo.set_make_working_trees(False)
 
841
        # we want:
 
842
        t = repo.bzrdir.get_repository_transport(None)
 
843
        self.check_format(t)
 
844
        # XXX: no locks left when unlocked at the moment
 
845
        # self.assertEqualDiff('', t.get('lock').read())
 
846
        # We should have a 'shared-storage' marker file.
 
847
        self.assertEqualDiff('', t.get('shared-storage').read())
 
848
        # We should have a marker for the no-working-trees flag.
 
849
        self.assertEqualDiff('', t.get('no-working-trees').read())
 
850
        # The marker should go when we toggle the setting.
 
851
        repo.set_make_working_trees(True)
 
852
        self.assertFalse(t.has('no-working-trees'))
 
853
        self.check_databases(t)
 
854
 
 
855
    def test_adding_revision_creates_pack_indices(self):
 
856
        format = self.get_format()
 
857
        tree = self.make_branch_and_tree('.', format=format)
 
858
        trans = tree.branch.repository.bzrdir.get_repository_transport(None)
 
859
        self.assertEqual([],
 
860
            list(GraphIndex(trans, 'pack-names', None).iter_all_entries()))
 
861
        tree.commit('foobarbaz')
 
862
        index = GraphIndex(trans, 'pack-names', None)
 
863
        index_nodes = list(index.iter_all_entries())
 
864
        self.assertEqual(1, len(index_nodes))
 
865
        node = index_nodes[0]
 
866
        name = node[1][0]
 
867
        # the pack sizes should be listed in the index
 
868
        pack_value = node[2]
 
869
        sizes = [int(digits) for digits in pack_value.split(' ')]
 
870
        for size, suffix in zip(sizes, ['.rix', '.iix', '.tix', '.six']):
 
871
            stat = trans.stat('indices/%s%s' % (name, suffix))
 
872
            self.assertEqual(size, stat.st_size)
 
873
 
 
874
    def test_pulling_nothing_leads_to_no_new_names(self):
 
875
        format = self.get_format()
 
876
        tree1 = self.make_branch_and_tree('1', format=format)
 
877
        tree2 = self.make_branch_and_tree('2', format=format)
 
878
        tree1.branch.repository.fetch(tree2.branch.repository)
 
879
        trans = tree1.branch.repository.bzrdir.get_repository_transport(None)
 
880
        self.assertEqual([],
 
881
            list(GraphIndex(trans, 'pack-names', None).iter_all_entries()))
 
882
 
 
883
    def test_commit_across_pack_shape_boundary_autopacks(self):
 
884
        format = self.get_format()
 
885
        tree = self.make_branch_and_tree('.', format=format)
 
886
        trans = tree.branch.repository.bzrdir.get_repository_transport(None)
 
887
        # This test could be a little cheaper by replacing the packs
 
888
        # attribute on the repository to allow a different pack distribution
 
889
        # and max packs policy - so we are checking the policy is honoured
 
890
        # in the test. But for now 11 commits is not a big deal in a single
 
891
        # test.
 
892
        for x in range(9):
 
893
            tree.commit('commit %s' % x)
 
894
        # there should be 9 packs:
 
895
        index = GraphIndex(trans, 'pack-names', None)
 
896
        self.assertEqual(9, len(list(index.iter_all_entries())))
 
897
        # insert some files in obsolete_packs which should be removed by pack.
 
898
        trans.put_bytes('obsolete_packs/foo', '123')
 
899
        trans.put_bytes('obsolete_packs/bar', '321')
 
900
        # committing one more should coalesce to 1 of 10.
 
901
        tree.commit('commit triggering pack')
 
902
        index = GraphIndex(trans, 'pack-names', None)
 
903
        self.assertEqual(1, len(list(index.iter_all_entries())))
 
904
        # packing should not damage data
 
905
        tree = tree.bzrdir.open_workingtree()
 
906
        check_result = tree.branch.repository.check(
 
907
            [tree.branch.last_revision()])
 
908
        # We should have 50 (10x5) files in the obsolete_packs directory.
 
909
        obsolete_files = list(trans.list_dir('obsolete_packs'))
 
910
        self.assertFalse('foo' in obsolete_files)
 
911
        self.assertFalse('bar' in obsolete_files)
 
912
        self.assertEqual(50, len(obsolete_files))
 
913
        # XXX: Todo check packs obsoleted correctly - old packs and indices
 
914
        # in the obsolete_packs directory.
 
915
        large_pack_name = list(index.iter_all_entries())[0][1][0]
 
916
        # finally, committing again should not touch the large pack.
 
917
        tree.commit('commit not triggering pack')
 
918
        index = GraphIndex(trans, 'pack-names', None)
 
919
        self.assertEqual(2, len(list(index.iter_all_entries())))
 
920
        pack_names = [node[1][0] for node in index.iter_all_entries()]
 
921
        self.assertTrue(large_pack_name in pack_names)
 
922
 
 
923
    def test_pack_after_two_commits_packs_everything(self):
 
924
        format = self.get_format()
 
925
        tree = self.make_branch_and_tree('.', format=format)
 
926
        trans = tree.branch.repository.bzrdir.get_repository_transport(None)
 
927
        tree.commit('start')
 
928
        tree.commit('more work')
 
929
        tree.branch.repository.pack()
 
930
        # there should be 1 pack:
 
931
        index = GraphIndex(trans, 'pack-names', None)
 
932
        self.assertEqual(1, len(list(index.iter_all_entries())))
 
933
        self.assertEqual(2, len(tree.branch.repository.all_revision_ids()))
 
934
 
 
935
    def test_pack_layout(self):
 
936
        format = self.get_format()
 
937
        tree = self.make_branch_and_tree('.', format=format)
 
938
        trans = tree.branch.repository.bzrdir.get_repository_transport(None)
 
939
        tree.commit('start', rev_id='1')
 
940
        tree.commit('more work', rev_id='2')
 
941
        tree.branch.repository.pack()
 
942
        tree.lock_read()
 
943
        self.addCleanup(tree.unlock)
 
944
        pack = tree.branch.repository._pack_collection.get_pack_by_name(
 
945
            tree.branch.repository._pack_collection.names()[0])
 
946
        # revision access tends to be tip->ancestor, so ordering that way on 
 
947
        # disk is a good idea.
 
948
        for _1, key, val, refs in pack.revision_index.iter_all_entries():
 
949
            if key == ('1',):
 
950
                pos_1 = int(val[1:].split()[0])
 
951
            else:
 
952
                pos_2 = int(val[1:].split()[0])
 
953
        self.assertTrue(pos_2 < pos_1)
 
954
 
 
955
    def test_pack_repositories_support_multiple_write_locks(self):
 
956
        format = self.get_format()
 
957
        self.make_repository('.', shared=True, format=format)
 
958
        r1 = repository.Repository.open('.')
 
959
        r2 = repository.Repository.open('.')
 
960
        r1.lock_write()
 
961
        self.addCleanup(r1.unlock)
 
962
        r2.lock_write()
 
963
        r2.unlock()
 
964
 
 
965
    def _add_text(self, repo, fileid):
 
966
        """Add a text to the repository within a write group."""
 
967
        vf =repo.weave_store.get_weave(fileid, repo.get_transaction())
 
968
        vf.add_lines('samplerev+' + fileid, [], [])
 
969
 
 
970
    def test_concurrent_writers_merge_new_packs(self):
 
971
        format = self.get_format()
 
972
        self.make_repository('.', shared=True, format=format)
 
973
        r1 = repository.Repository.open('.')
 
974
        r2 = repository.Repository.open('.')
 
975
        r1.lock_write()
 
976
        try:
 
977
            # access enough data to load the names list
 
978
            list(r1.all_revision_ids())
 
979
            r2.lock_write()
 
980
            try:
 
981
                # access enough data to load the names list
 
982
                list(r2.all_revision_ids())
 
983
                r1.start_write_group()
 
984
                try:
 
985
                    r2.start_write_group()
 
986
                    try:
 
987
                        self._add_text(r1, 'fileidr1')
 
988
                        self._add_text(r2, 'fileidr2')
 
989
                    except:
 
990
                        r2.abort_write_group()
 
991
                        raise
 
992
                except:
 
993
                    r1.abort_write_group()
 
994
                    raise
 
995
                # both r1 and r2 have open write groups with data in them
 
996
                # created while the other's write group was open.
 
997
                # Commit both, which requires a merge to the pack-names.
 
998
                try:
 
999
                    r1.commit_write_group()
 
1000
                except:
 
1001
                    r1.abort_write_group()
 
1002
                    r2.abort_write_group()
 
1003
                    raise
 
1004
                r2.commit_write_group()
 
1005
                # tell r1 to reload from disk
 
1006
                r1._pack_collection.reset()
 
1007
                # Now both repositories should know about both names
 
1008
                r1._pack_collection.ensure_loaded()
 
1009
                r2._pack_collection.ensure_loaded()
 
1010
                self.assertEqual(r1._pack_collection.names(), r2._pack_collection.names())
 
1011
                self.assertEqual(2, len(r1._pack_collection.names()))
 
1012
            finally:
 
1013
                r2.unlock()
 
1014
        finally:
 
1015
            r1.unlock()
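# A sketch of the pack-names reconciliation this test depends on (assumed
# logic for illustration, not the bzrlib implementation): a committing
# writer merges its in-memory additions and removals with whatever is on
# disk, so a concurrent writer's packs survive.
def merge_pack_names(names_at_load, names_now, names_on_disk):
    added = names_now - names_at_load       # packs this writer created
    removed = names_at_load - names_now     # packs this writer dropped
    return (names_on_disk | added) - removed
# With each writer adding one pack, both end up seeing both names, which
# is why len(r1._pack_collection.names()) is asserted to be 2.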
 
1016
 
 
1017
    def test_concurrent_writer_second_preserves_dropping_a_pack(self):
 
1018
        format = self.get_format()
 
1019
        self.make_repository('.', shared=True, format=format)
 
1020
        r1 = repository.Repository.open('.')
 
1021
        r2 = repository.Repository.open('.')
 
1022
        # add a pack to drop
 
1023
        r1.lock_write()
 
1024
        try:
 
1025
            r1.start_write_group()
 
1026
            try:
 
1027
                self._add_text(r1, 'fileidr1')
 
1028
            except:
 
1029
                r1.abort_write_group()
 
1030
                raise
 
1031
            else:
 
1032
                r1.commit_write_group()
 
1033
            r1._pack_collection.ensure_loaded()
 
1034
            name_to_drop = r1._pack_collection.all_packs()[0].name
 
1035
        finally:
 
1036
            r1.unlock()
 
1037
        r1.lock_write()
 
1038
        try:
 
1039
            # access enough data to load the names list
 
1040
            list(r1.all_revision_ids())
 
1041
            r2.lock_write()
 
1042
            try:
 
1043
                # access enough data to load the names list
 
1044
                list(r2.all_revision_ids())
 
1045
                r1._pack_collection.ensure_loaded()
 
1046
                try:
 
1047
                    r2.start_write_group()
 
1048
                    try:
 
1049
                        # in r1, drop the pack
 
1050
                        r1._pack_collection._remove_pack_from_memory(
 
1051
                            r1._pack_collection.get_pack_by_name(name_to_drop))
 
1052
                        # in r2, add a pack
 
1053
                        self._add_text(r2, 'fileidr2')
 
1054
                    except:
 
1055
                        r2.abort_write_group()
 
1056
                        raise
 
1057
                except:
 
1058
                    r1._pack_collection.reset()
 
1059
                    raise
 
1060
                # r1 has a changed names list, and r2 an open write group with
 
1061
                # changes.
 
1062
                # save r1, and then commit the r2 write group, which requires a
 
1063
                # merge to the pack-names, which should not reinstate
 
1064
                # name_to_drop
 
1065
                try:
 
1066
                    r1._pack_collection._save_pack_names()
 
1067
                    r1._pack_collection.reset()
 
1068
                except:
 
1069
                    r2.abort_write_group()
 
1070
                    raise
 
1071
                try:
 
1072
                    r2.commit_write_group()
 
1073
                except:
 
1074
                    r2.abort_write_group()
 
1075
                    raise
 
1076
                # Now both repositories should know about just one name.
 
1077
                r1._pack_collection.ensure_loaded()
 
1078
                r2._pack_collection.ensure_loaded()
 
1079
                self.assertEqual(r1._pack_collection.names(), r2._pack_collection.names())
 
1080
                self.assertEqual(1, len(r1._pack_collection.names()))
 
1081
                self.assertFalse(name_to_drop in r1._pack_collection.names())
 
1082
            finally:
 
1083
                r2.unlock()
 
1084
        finally:
 
1085
            r1.unlock()
 
1086
 
 
1087
    def test_lock_write_does_not_physically_lock(self):
 
1088
        repo = self.make_repository('.', format=self.get_format())
 
1089
        repo.lock_write()
 
1090
        self.addCleanup(repo.unlock)
 
1091
        self.assertFalse(repo.get_physical_lock_status())
 
1092
 
 
1093
    def prepare_for_break_lock(self):
 
1094
        # Set up the global ui factory state so that a break-lock method call
 
1095
        # will find usable input in the input stream.
 
1096
        old_factory = bzrlib.ui.ui_factory
 
1097
        def restoreFactory():
 
1098
            bzrlib.ui.ui_factory = old_factory
 
1099
        self.addCleanup(restoreFactory)
 
1100
        bzrlib.ui.ui_factory = bzrlib.ui.SilentUIFactory()
 
1101
        bzrlib.ui.ui_factory.stdin = StringIO("y\n")
 
1102
 
 
1103
    def test_break_lock_breaks_physical_lock(self):
 
1104
        repo = self.make_repository('.', format=self.get_format())
 
1105
        repo._pack_collection.lock_names()
 
1106
        repo2 = repository.Repository.open('.')
 
1107
        self.assertTrue(repo.get_physical_lock_status())
 
1108
        self.prepare_for_break_lock()
 
1109
        repo2.break_lock()
 
1110
        self.assertFalse(repo.get_physical_lock_status())
 
1111
 
 
1112
    def test_broken_physical_locks_error_on__unlock_names_lock(self):
 
1113
        repo = self.make_repository('.', format=self.get_format())
 
1114
        repo._pack_collection.lock_names()
 
1115
        self.assertTrue(repo.get_physical_lock_status())
 
1116
        repo2 = repository.Repository.open('.')
 
1117
        self.prepare_for_break_lock()
 
1118
        repo2.break_lock()
 
1119
        self.assertRaises(errors.LockBroken, repo._pack_collection._unlock_names)
 
1120
 
 
1121
    def test_fetch_without_find_ghosts_ignores_ghosts(self):
 
1122
        # we want two repositories at this point:
 
1123
        # one with a revision that is a ghost in the other
 
1124
        # repository.
 
1125
        # 'ghost' is present in has_ghost, 'ghost' is absent in 'missing_ghost'.
 
1126
        # 'references' is present in both repositories, and 'tip' is present
 
1127
        # just in has_ghost.
 
1128
        # has_ghost       missing_ghost
 
1129
        #------------------------------
 
1130
        # 'ghost'             -
 
1131
        # 'references'    'references'
 
1132
        # 'tip'               -
 
1133
        # In this test we fetch 'tip', which should not fetch 'ghost'.
 
1134
        has_ghost = self.make_repository('has_ghost', format=self.get_format())
 
1135
        missing_ghost = self.make_repository('missing_ghost',
 
1136
            format=self.get_format())
 
1137
 
 
1138
        def add_commit(repo, revision_id, parent_ids):
 
1139
            repo.lock_write()
 
1140
            repo.start_write_group()
 
1141
            inv = inventory.Inventory(revision_id=revision_id)
 
1142
            inv.root.revision = revision_id
 
1143
            root_id = inv.root.file_id
 
1144
            sha1 = repo.add_inventory(revision_id, inv, [])
 
1145
            vf = repo.weave_store.get_weave_or_empty(root_id,
 
1146
                repo.get_transaction())
 
1147
            vf.add_lines(revision_id, [], [])
 
1148
            rev = bzrlib.revision.Revision(timestamp=0,
 
1149
                                           timezone=None,
 
1150
                                           committer="Foo Bar <foo@example.com>",
 
1151
                                           message="Message",
 
1152
                                           inventory_sha1=sha1,
 
1153
                                           revision_id=revision_id)
 
1154
            rev.parent_ids = parent_ids
 
1155
            repo.add_revision(revision_id, rev)
 
1156
            repo.commit_write_group()
 
1157
            repo.unlock()
 
1158
        add_commit(has_ghost, 'ghost', [])
 
1159
        add_commit(has_ghost, 'references', ['ghost'])
 
1160
        add_commit(missing_ghost, 'references', ['ghost'])
 
1161
        add_commit(has_ghost, 'tip', ['references'])
 
1162
        missing_ghost.fetch(has_ghost, 'tip')
 
1163
        # missing ghost now has tip and not ghost.
 
1164
        rev = missing_ghost.get_revision('tip')
 
1165
        inv = missing_ghost.get_inventory('tip')
 
1166
        self.assertRaises(errors.NoSuchRevision,
 
1167
            missing_ghost.get_revision, 'ghost')
 
1168
        self.assertRaises(errors.RevisionNotPresent,
 
1169
            missing_ghost.get_inventory, 'ghost')
 
1170
 
 
1171
 
 
1172
class TestKnitPackSubtrees(TestKnitPackNoSubtrees):
 
1173
 
 
1174
    def get_format(self):
 
1175
        return bzrdir.format_registry.make_bzrdir(
 
1176
            'pack-0.92-subtree')
 
1177
 
 
1178
    def check_format(self, t):
 
1179
        self.assertEqualDiff(
 
1180
            "Bazaar pack repository format 1 with subtree support (needs bzr 0.92)\n",
 
1181
            t.get('format').read())
1106
1182
 
1107
1183
 
1108
1184
class TestRepositoryPackCollection(TestCaseWithTransport):
1110
1186
    def get_format(self):
1111
1187
        return bzrdir.format_registry.make_bzrdir('pack-0.92')
1112
1188
 
1113
 
    def get_packs(self):
1114
 
        format = self.get_format()
1115
 
        repo = self.make_repository('.', format=format)
1116
 
        return repo._pack_collection
1117
 
 
1118
 
    def make_packs_and_alt_repo(self, write_lock=False):
1119
 
        """Create a pack repo with 3 packs, and access it via a second repo."""
1120
 
        tree = self.make_branch_and_tree('.', format=self.get_format())
1121
 
        tree.lock_write()
1122
 
        self.addCleanup(tree.unlock)
1123
 
        rev1 = tree.commit('one')
1124
 
        rev2 = tree.commit('two')
1125
 
        rev3 = tree.commit('three')
1126
 
        r = repository.Repository.open('.')
1127
 
        if write_lock:
1128
 
            r.lock_write()
1129
 
        else:
1130
 
            r.lock_read()
1131
 
        self.addCleanup(r.unlock)
1132
 
        packs = r._pack_collection
1133
 
        packs.ensure_loaded()
1134
 
        return tree, r, packs, [rev1, rev2, rev3]
1135
 
 
1136
 
    def test__clear_obsolete_packs(self):
1137
 
        packs = self.get_packs()
1138
 
        obsolete_pack_trans = packs.transport.clone('obsolete_packs')
1139
 
        obsolete_pack_trans.put_bytes('a-pack.pack', 'content\n')
1140
 
        obsolete_pack_trans.put_bytes('a-pack.rix', 'content\n')
1141
 
        obsolete_pack_trans.put_bytes('a-pack.iix', 'content\n')
1142
 
        obsolete_pack_trans.put_bytes('another-pack.pack', 'foo\n')
1143
 
        obsolete_pack_trans.put_bytes('not-a-pack.rix', 'foo\n')
1144
 
        res = packs._clear_obsolete_packs()
1145
 
        self.assertEqual(['a-pack', 'another-pack'], sorted(res))
1146
 
        self.assertEqual([], obsolete_pack_trans.list_dir('.'))
1147
 
 
1148
 
    def test__clear_obsolete_packs_preserve(self):
1149
 
        packs = self.get_packs()
1150
 
        obsolete_pack_trans = packs.transport.clone('obsolete_packs')
1151
 
        obsolete_pack_trans.put_bytes('a-pack.pack', 'content\n')
1152
 
        obsolete_pack_trans.put_bytes('a-pack.rix', 'content\n')
1153
 
        obsolete_pack_trans.put_bytes('a-pack.iix', 'content\n')
1154
 
        obsolete_pack_trans.put_bytes('another-pack.pack', 'foo\n')
1155
 
        obsolete_pack_trans.put_bytes('not-a-pack.rix', 'foo\n')
1156
 
        res = packs._clear_obsolete_packs(preserve=set(['a-pack']))
1157
 
        self.assertEqual(['a-pack', 'another-pack'], sorted(res))
1158
 
        self.assertEqual(['a-pack.iix', 'a-pack.pack', 'a-pack.rix'],
1159
 
                         sorted(obsolete_pack_trans.list_dir('.')))
1160
 
 
1161
1189
    def test__max_pack_count(self):
1162
1190
        """The maximum pack count is a function of the number of revisions."""
 
1191
        format = self.get_format()
 
1192
        repo = self.make_repository('.', format=format)
 
1193
        packs = repo._pack_collection
1163
1194
        # no revisions - one pack, so that we can have a revision-free repo
1164
1195
        # without it blowing up
1165
 
        packs = self.get_packs()
1166
1196
        self.assertEqual(1, packs._max_pack_count(0))
1167
1197
        # after that, the cap is the sum of the digits - check the first 1-9
1168
1198
        self.assertEqual(1, packs._max_pack_count(1))
1183
1213
        # check some arbitrary big numbers
1184
1214
        self.assertEqual(25, packs._max_pack_count(112894))
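# A sketch of the policy these assertions describe (for illustration; the
# real _max_pack_count lives in bzrlib.repofmt.pack_repo): one pack is
# allowed for an empty repository, otherwise the cap is the sum of the
# decimal digits of the revision count.
def max_pack_count(total_revisions):
    if total_revisions == 0:
        return 1
    return sum(int(digit) for digit in str(total_revisions))
# e.g. max_pack_count(112894) == 1 + 1 + 2 + 8 + 9 + 4 == 25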
1185
1215
 
1186
 
    def test_repr(self):
1187
 
        packs = self.get_packs()
1188
 
        self.assertContainsRe(repr(packs),
1189
 
            'RepositoryPackCollection(.*Repository(.*))')
1190
 
 
1191
 
    def test__obsolete_packs(self):
1192
 
        tree, r, packs, revs = self.make_packs_and_alt_repo(write_lock=True)
1193
 
        names = packs.names()
1194
 
        pack = packs.get_pack_by_name(names[0])
1195
 
        # Schedule this one for removal
1196
 
        packs._remove_pack_from_memory(pack)
1197
 
        # Simulate a concurrent update by renaming the .pack file and one of
1198
 
        # the indices
1199
 
        packs.transport.rename('packs/%s.pack' % (names[0],),
1200
 
                               'obsolete_packs/%s.pack' % (names[0],))
1201
 
        packs.transport.rename('indices/%s.iix' % (names[0],),
1202
 
                               'obsolete_packs/%s.iix' % (names[0],))
1203
 
        # Now trigger the obsoletion, and ensure that all the remaining files
1204
 
        # are still renamed
1205
 
        packs._obsolete_packs([pack])
1206
 
        self.assertEqual([n + '.pack' for n in names[1:]],
1207
 
                         sorted(packs._pack_transport.list_dir('.')))
1208
 
        # names[0] should not be present in the index anymore
1209
 
        self.assertEqual(names[1:],
1210
 
            sorted(set([osutils.splitext(n)[0] for n in
1211
 
                        packs._index_transport.list_dir('.')])))
1212
 
 
1213
1216
    def test_pack_distribution_zero(self):
1214
 
        packs = self.get_packs()
 
1217
        format = self.get_format()
 
1218
        repo = self.make_repository('.', format=format)
 
1219
        packs = repo._pack_collection
1215
1220
        self.assertEqual([0], packs.pack_distribution(0))
1216
1221
 
1217
1222
    def test_ensure_loaded_unlocked(self):
1218
 
        packs = self.get_packs()
 
1223
        format = self.get_format()
 
1224
        repo = self.make_repository('.', format=format)
1219
1225
        self.assertRaises(errors.ObjectNotLocked,
1220
 
                          packs.ensure_loaded)
 
1226
                          repo._pack_collection.ensure_loaded)
1221
1227
 
1222
1228
    def test_pack_distribution_one_to_nine(self):
1223
 
        packs = self.get_packs()
 
1229
        format = self.get_format()
 
1230
        repo = self.make_repository('.', format=format)
 
1231
        packs = repo._pack_collection
1224
1232
        self.assertEqual([1],
1225
1233
            packs.pack_distribution(1))
1226
1234
        self.assertEqual([1, 1],
1242
1250
 
1243
1251
    def test_pack_distribution_stable_at_boundaries(self):
1244
1252
        """When there are multi-rev packs the counts are stable."""
1245
 
        packs = self.get_packs()
 
1253
        format = self.get_format()
 
1254
        repo = self.make_repository('.', format=format)
 
1255
        packs = repo._pack_collection
1246
1256
        # in 10s:
1247
1257
        self.assertEqual([10], packs.pack_distribution(10))
1248
1258
        self.assertEqual([10, 1], packs.pack_distribution(11))
1257
1267
        self.assertEqual([100, 100, 10, 1], packs.pack_distribution(211))
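# A sketch consistent with the distributions asserted in these tests (the
# real pack_distribution lives in bzrlib.repofmt.pack_repo): each decimal
# digit d at magnitude 10**n contributes d packs of 10**n revisions.
def pack_distribution(total_revisions):
    if total_revisions == 0:
        return [0]
    result = []
    for power, digit in enumerate(reversed(str(total_revisions))):
        result = [10 ** power] * int(digit) + result
    return result
# pack_distribution(211) == [100, 100, 10, 1]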
1258
1268
 
1259
1269
    def test_plan_pack_operations_2009_revisions_skip_all_packs(self):
1260
 
        packs = self.get_packs()
 
1270
        format = self.get_format()
 
1271
        repo = self.make_repository('.', format=format)
 
1272
        packs = repo._pack_collection
1261
1273
        existing_packs = [(2000, "big"), (9, "medium")]
1262
1274
        # rev count - 2009 -> 2x1000 + 9x1
1263
1275
        pack_operations = packs.plan_autopack_combinations(
1265
1277
        self.assertEqual([], pack_operations)
1266
1278
 
1267
1279
    def test_plan_pack_operations_2010_revisions_skip_all_packs(self):
1268
 
        packs = self.get_packs()
 
1280
        format = self.get_format()
 
1281
        repo = self.make_repository('.', format=format)
 
1282
        packs = repo._pack_collection
1269
1283
        existing_packs = [(2000, "big"), (9, "medium"), (1, "single")]
1270
1284
        # rev count - 2010 -> 2x1000 + 1x10
1271
1285
        pack_operations = packs.plan_autopack_combinations(
1273
1287
        self.assertEqual([], pack_operations)
1274
1288
 
1275
1289
    def test_plan_pack_operations_2010_combines_smallest_two(self):
1276
 
        packs = self.get_packs()
 
1290
        format = self.get_format()
 
1291
        repo = self.make_repository('.', format=format)
 
1292
        packs = repo._pack_collection
1277
1293
        existing_packs = [(1999, "big"), (9, "medium"), (1, "single2"),
1278
1294
            (1, "single1")]
1279
1295
        # rev count - 2010 -> 2x1000 + 1x10 (3)
1280
1296
        pack_operations = packs.plan_autopack_combinations(
1281
1297
            existing_packs, [1000, 1000, 10])
1282
 
        self.assertEqual([[2, ["single2", "single1"]]], pack_operations)
1283
 
 
1284
 
    def test_plan_pack_operations_creates_a_single_op(self):
1285
 
        packs = self.get_packs()
1286
 
        existing_packs = [(50, 'a'), (40, 'b'), (30, 'c'), (10, 'd'),
1287
 
                          (10, 'e'), (6, 'f'), (4, 'g')]
1288
 
        # rev count 150 -> 1x100 and 5x10
1289
 
        # The two size 10 packs do not need to be touched. The 50, 40, 30 would
1290
 
        # be combined into a single 120 size pack, and the 6 & 4 would
1291
 
        # be combined into a size 10 pack. However, if we have to rewrite them,
1292
 
        # we save a pack file with no increased I/O by putting them into the
1293
 
        # same file.
1294
 
        distribution = packs.pack_distribution(150)
1295
 
        pack_operations = packs.plan_autopack_combinations(existing_packs,
1296
 
                                                           distribution)
1297
 
        self.assertEqual([[130, ['a', 'b', 'c', 'f', 'g']]], pack_operations)
 
1298
        self.assertEqual([[2, ["single2", "single1"]], [0, []]], pack_operations)
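# Worked numbers for the single combined operation asserted above: packs
# 'a', 'b', 'c', 'f' and 'g' are rewritten together, while 'd' and 'e'
# (10 revisions each) already fit the 10-buckets and are left alone.
assert 50 + 40 + 30 + 6 + 4 == 130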
1298
1299
 
1299
1300
    def test_all_packs_none(self):
1300
1301
        format = self.get_format()
1338
1339
        tree.lock_read()
1339
1340
        self.addCleanup(tree.unlock)
1340
1341
        packs = tree.branch.repository._pack_collection
1341
 
        packs.reset()
1342
1342
        packs.ensure_loaded()
1343
1343
        name = packs.names()[0]
1344
1344
        pack_1 = packs.get_pack_by_name(name)
1345
1345
        # the pack should be correctly initialised
1346
 
        sizes = packs._names[name]
1347
 
        rev_index = GraphIndex(packs._index_transport, name + '.rix', sizes[0])
1348
 
        inv_index = GraphIndex(packs._index_transport, name + '.iix', sizes[1])
1349
 
        txt_index = GraphIndex(packs._index_transport, name + '.tix', sizes[2])
1350
 
        sig_index = GraphIndex(packs._index_transport, name + '.six', sizes[3])
 
1346
        rev_index = GraphIndex(packs._index_transport, name + '.rix',
 
1347
            packs._names[name][0])
 
1348
        inv_index = GraphIndex(packs._index_transport, name + '.iix',
 
1349
            packs._names[name][1])
 
1350
        txt_index = GraphIndex(packs._index_transport, name + '.tix',
 
1351
            packs._names[name][2])
 
1352
        sig_index = GraphIndex(packs._index_transport, name + '.six',
 
1353
            packs._names[name][3])
1351
1354
        self.assertEqual(pack_repo.ExistingPack(packs._pack_transport,
1352
1355
            name, rev_index, inv_index, txt_index, sig_index), pack_1)
1353
1356
        # and the same instance should be returned on successive calls.
1354
1357
        self.assertTrue(pack_1 is packs.get_pack_by_name(name))
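# Index suffix naming as exercised above: sizes[0..3] from pack-names are
# the lengths of, respectively, the revision (.rix), inventory (.iix),
# text (.tix) and signature (.six) indices.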
1355
1358
 
1356
 
    def test_reload_pack_names_new_entry(self):
1357
 
        tree, r, packs, revs = self.make_packs_and_alt_repo()
1358
 
        names = packs.names()
1359
 
        # Add a new pack file into the repository
1360
 
        rev4 = tree.commit('four')
1361
 
        new_names = tree.branch.repository._pack_collection.names()
1362
 
        new_name = set(new_names).difference(names)
1363
 
        self.assertEqual(1, len(new_name))
1364
 
        new_name = new_name.pop()
1365
 
        # The old collection hasn't noticed yet
1366
 
        self.assertEqual(names, packs.names())
1367
 
        self.assertTrue(packs.reload_pack_names())
1368
 
        self.assertEqual(new_names, packs.names())
1369
 
        # And the repository can access the new revision
1370
 
        self.assertEqual({rev4:(revs[-1],)}, r.get_parent_map([rev4]))
1371
 
        self.assertFalse(packs.reload_pack_names())
1372
 
 
1373
 
    def test_reload_pack_names_added_and_removed(self):
1374
 
        tree, r, packs, revs = self.make_packs_and_alt_repo()
1375
 
        names = packs.names()
1376
 
        # Now repack the whole thing
1377
 
        tree.branch.repository.pack()
1378
 
        new_names = tree.branch.repository._pack_collection.names()
1379
 
        # The other collection hasn't noticed yet
1380
 
        self.assertEqual(names, packs.names())
1381
 
        self.assertTrue(packs.reload_pack_names())
1382
 
        self.assertEqual(new_names, packs.names())
1383
 
        self.assertEqual({revs[-1]:(revs[-2],)}, r.get_parent_map([revs[-1]]))
1384
 
        self.assertFalse(packs.reload_pack_names())
1385
 
 
1386
 
    def test_reload_pack_names_preserves_pending(self):
1387
 
        # TODO: Update this to also test for pending-deleted names
1388
 
        tree, r, packs, revs = self.make_packs_and_alt_repo(write_lock=True)
1389
 
        # We will add one pack (via start_write_group + insert_record_stream),
1390
 
        # and remove another pack (via _remove_pack_from_memory)
1391
 
        orig_names = packs.names()
1392
 
        orig_at_load = packs._packs_at_load
1393
 
        to_remove_name = iter(orig_names).next()
1394
 
        r.start_write_group()
1395
 
        self.addCleanup(r.abort_write_group)
1396
 
        r.texts.insert_record_stream([versionedfile.FulltextContentFactory(
1397
 
            ('text', 'rev'), (), None, 'content\n')])
1398
 
        new_pack = packs._new_pack
1399
 
        self.assertTrue(new_pack.data_inserted())
1400
 
        new_pack.finish()
1401
 
        packs.allocate(new_pack)
1402
 
        packs._new_pack = None
1403
 
        removed_pack = packs.get_pack_by_name(to_remove_name)
1404
 
        packs._remove_pack_from_memory(removed_pack)
1405
 
        names = packs.names()
1406
 
        all_nodes, deleted_nodes, new_nodes, _ = packs._diff_pack_names()
1407
 
        new_names = set([x[0][0] for x in new_nodes])
1408
 
        self.assertEqual(names, sorted([x[0][0] for x in all_nodes]))
1409
 
        self.assertEqual(set(names) - set(orig_names), new_names)
1410
 
        self.assertEqual(set([new_pack.name]), new_names)
1411
 
        self.assertEqual([to_remove_name],
1412
 
                         sorted([x[0][0] for x in deleted_nodes]))
1413
 
        packs.reload_pack_names()
1414
 
        reloaded_names = packs.names()
1415
 
        self.assertEqual(orig_at_load, packs._packs_at_load)
1416
 
        self.assertEqual(names, reloaded_names)
1417
 
        all_nodes, deleted_nodes, new_nodes, _ = packs._diff_pack_names()
1418
 
        new_names = set([x[0][0] for x in new_nodes])
1419
 
        self.assertEqual(names, sorted([x[0][0] for x in all_nodes]))
1420
 
        self.assertEqual(set(names) - set(orig_names), new_names)
1421
 
        self.assertEqual(set([new_pack.name]), new_names)
1422
 
        self.assertEqual([to_remove_name],
1423
 
                         sorted([x[0][0] for x in deleted_nodes]))
1424
 
 
1425
 
    def test_autopack_obsoletes_new_pack(self):
1426
 
        tree, r, packs, revs = self.make_packs_and_alt_repo(write_lock=True)
1427
 
        packs._max_pack_count = lambda x: 1
1428
 
        packs.pack_distribution = lambda x: [10]
1429
 
        r.start_write_group()
1430
 
        r.revisions.insert_record_stream([versionedfile.FulltextContentFactory(
1431
 
            ('bogus-rev',), (), None, 'bogus-content\n')])
1432
 
        # This should trigger an autopack, which will combine everything into a
1433
 
        # single pack file.
1434
 
        new_names = r.commit_write_group()
1435
 
        names = packs.names()
1436
 
        self.assertEqual(1, len(names))
1437
 
        self.assertEqual([names[0] + '.pack'],
1438
 
                         packs._pack_transport.list_dir('.'))
1439
 
 
1440
 
    def test_autopack_reloads_and_stops(self):
1441
 
        tree, r, packs, revs = self.make_packs_and_alt_repo(write_lock=True)
1442
 
        # After we have determined what needs to be autopacked, trigger a
1443
 
        # full-pack via the other repo which will cause us to re-evaluate and
1444
 
        # decide we don't need to do anything
1445
 
        orig_execute = packs._execute_pack_operations
1446
 
        def _munged_execute_pack_ops(*args, **kwargs):
1447
 
            tree.branch.repository.pack()
1448
 
            return orig_execute(*args, **kwargs)
1449
 
        packs._execute_pack_operations = _munged_execute_pack_ops
1450
 
        packs._max_pack_count = lambda x: 1
1451
 
        packs.pack_distribution = lambda x: [10]
1452
 
        self.assertFalse(packs.autopack())
1453
 
        self.assertEqual(1, len(packs.names()))
1454
 
        self.assertEqual(tree.branch.repository._pack_collection.names(),
1455
 
                         packs.names())
1456
 
 
1457
 
    def test__save_pack_names(self):
1458
 
        tree, r, packs, revs = self.make_packs_and_alt_repo(write_lock=True)
1459
 
        names = packs.names()
1460
 
        pack = packs.get_pack_by_name(names[0])
1461
 
        packs._remove_pack_from_memory(pack)
1462
 
        packs._save_pack_names(obsolete_packs=[pack])
1463
 
        cur_packs = packs._pack_transport.list_dir('.')
1464
 
        self.assertEqual([n + '.pack' for n in names[1:]], sorted(cur_packs))
1465
 
        # obsolete_packs will also have stuff like .rix and .iix present.
1466
 
        obsolete_packs = packs.transport.list_dir('obsolete_packs')
1467
 
        obsolete_names = set([osutils.splitext(n)[0] for n in obsolete_packs])
1468
 
        self.assertEqual([pack.name], sorted(obsolete_names))
1469
 
 
1470
 
    def test__save_pack_names_already_obsoleted(self):
1471
 
        tree, r, packs, revs = self.make_packs_and_alt_repo(write_lock=True)
1472
 
        names = packs.names()
1473
 
        pack = packs.get_pack_by_name(names[0])
1474
 
        packs._remove_pack_from_memory(pack)
1475
 
        # We are going to simulate a concurrent autopack by manually obsoleting
1476
 
        # the pack directly.
1477
 
        packs._obsolete_packs([pack])
1478
 
        packs._save_pack_names(clear_obsolete_packs=True,
1479
 
                               obsolete_packs=[pack])
1480
 
        cur_packs = packs._pack_transport.list_dir('.')
1481
 
        self.assertEqual([n + '.pack' for n in names[1:]], sorted(cur_packs))
1482
 
        # Note that while we set clear_obsolete_packs=True, it should not
1483
 
        # delete a pack file that we have also scheduled for obsoletion.
1484
 
        obsolete_packs = packs.transport.list_dir('obsolete_packs')
1485
 
        obsolete_names = set([osutils.splitext(n)[0] for n in obsolete_packs])
1486
 
        self.assertEqual([pack.name], sorted(obsolete_names))
1487
 
 
1488
 
 
1489
1359
 
1490
1360
class TestPack(TestCaseWithTransport):
1491
1361
    """Tests for the Pack object."""
1545
1415
        pack_transport = self.get_transport('pack')
1546
1416
        index_transport = self.get_transport('index')
1547
1417
        upload_transport.mkdir('.')
1548
 
        collection = pack_repo.RepositoryPackCollection(
1549
 
            repo=None,
1550
 
            transport=self.get_transport('.'),
1551
 
            index_transport=index_transport,
1552
 
            upload_transport=upload_transport,
1553
 
            pack_transport=pack_transport,
1554
 
            index_builder_class=BTreeBuilder,
1555
 
            index_class=BTreeGraphIndex,
1556
 
            use_chk_index=False)
1557
 
        pack = pack_repo.NewPack(collection)
1558
 
        self.addCleanup(pack.abort) # Make sure the write stream gets closed
1559
 
        self.assertIsInstance(pack.revision_index, BTreeBuilder)
1560
 
        self.assertIsInstance(pack.inventory_index, BTreeBuilder)
1561
 
        self.assertIsInstance(pack._hash, type(osutils.md5()))
 
1418
        pack = pack_repo.NewPack(upload_transport, index_transport,
 
1419
            pack_transport)
 
1420
        self.assertIsInstance(pack.revision_index, InMemoryGraphIndex)
 
1421
        self.assertIsInstance(pack.inventory_index, InMemoryGraphIndex)
 
1422
        self.assertIsInstance(pack._hash, type(md5.new()))
1562
1423
        self.assertTrue(pack.upload_transport is upload_transport)
1563
1424
        self.assertTrue(pack.index_transport is index_transport)
1564
1425
        self.assertTrue(pack.pack_transport is pack_transport)
1571
1432
class TestPacker(TestCaseWithTransport):
1572
1433
    """Tests for the packs repository Packer class."""
1573
1434
 
1574
 
    def test_pack_optimizes_pack_order(self):
1575
 
        builder = self.make_branch_builder('.', format="1.9")
1576
 
        builder.start_series()
1577
 
        builder.build_snapshot('A', None, [
1578
 
            ('add', ('', 'root-id', 'directory', None)),
1579
 
            ('add', ('f', 'f-id', 'file', 'content\n'))])
1580
 
        builder.build_snapshot('B', ['A'],
1581
 
            [('modify', ('f-id', 'new-content\n'))])
1582
 
        builder.build_snapshot('C', ['B'],
1583
 
            [('modify', ('f-id', 'third-content\n'))])
1584
 
        builder.build_snapshot('D', ['C'],
1585
 
            [('modify', ('f-id', 'fourth-content\n'))])
1586
 
        b = builder.get_branch()
1587
 
        b.lock_read()
1588
 
        builder.finish_series()
1589
 
        self.addCleanup(b.unlock)
1590
 
        # At this point, we should have 4 pack files available
1591
 
        # Because of how they were built, they correspond to
1592
 
        # ['D', 'C', 'B', 'A']
1593
 
        packs = b.repository._pack_collection.packs
1594
 
        packer = pack_repo.Packer(b.repository._pack_collection,
1595
 
                                  packs, 'testing',
1596
 
                                  revision_ids=['B', 'C'])
1597
 
        # Now, when we are copying the B & C revisions, their pack files should
1598
 
        # be moved to the front of the stack
1599
 
        # The new ordering moves B & C to the front of the .packs attribute,
1600
 
        # and leaves the others in the original order.
1601
 
        new_packs = [packs[1], packs[2], packs[0], packs[3]]
1602
 
        new_pack = packer.pack()
1603
 
        self.assertEqual(new_packs, packer.packs)
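# A sketch of the reordering this test asserts (assumed behaviour, matching
# the expected result): packs holding the requested revisions move to the
# front, the others keep their relative order.
def reorder_packs(packs, wanted):
    front = [p for p in packs if p in wanted]
    rest = [p for p in packs if p not in wanted]
    return front + rest
# reorder_packs(['D', 'C', 'B', 'A'], set(['B', 'C'])) == ['C', 'B', 'D', 'A']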
1604
 
 
1605
 
 
1606
 
class TestOptimisingPacker(TestCaseWithTransport):
1607
 
    """Tests for the OptimisingPacker class."""
1608
 
 
1609
 
    def get_pack_collection(self):
1610
 
        repo = self.make_repository('.')
1611
 
        return repo._pack_collection
1612
 
 
1613
 
    def test_open_pack_will_optimise(self):
1614
 
        packer = pack_repo.OptimisingPacker(self.get_pack_collection(),
1615
 
                                            [], '.test')
1616
 
        new_pack = packer.open_pack()
1617
 
        self.addCleanup(new_pack.abort) # ensure cleanup
1618
 
        self.assertIsInstance(new_pack, pack_repo.NewPack)
1619
 
        self.assertTrue(new_pack.revision_index._optimize_for_size)
1620
 
        self.assertTrue(new_pack.inventory_index._optimize_for_size)
1621
 
        self.assertTrue(new_pack.text_index._optimize_for_size)
1622
 
        self.assertTrue(new_pack.signature_index._optimize_for_size)
1623
 
 
1624
 
 
1625
 
class TestCrossFormatPacks(TestCaseWithTransport):
1626
 
 
1627
 
    def log_pack(self, hint=None):
1628
 
        self.calls.append(('pack', hint))
1629
 
        self.orig_pack(hint=hint)
1630
 
        if self.expect_hint:
1631
 
            self.assertTrue(hint)
1632
 
 
1633
 
    def run_stream(self, src_fmt, target_fmt, expect_pack_called):
1634
 
        self.expect_hint = expect_pack_called
1635
 
        self.calls = []
1636
 
        source_tree = self.make_branch_and_tree('src', format=src_fmt)
1637
 
        source_tree.lock_write()
1638
 
        self.addCleanup(source_tree.unlock)
1639
 
        tip = source_tree.commit('foo')
1640
 
        target = self.make_repository('target', format=target_fmt)
1641
 
        target.lock_write()
1642
 
        self.addCleanup(target.unlock)
1643
 
        source = source_tree.branch.repository._get_source(target._format)
1644
 
        self.orig_pack = target.pack
1645
 
        target.pack = self.log_pack
1646
 
        search = target.search_missing_revision_ids(
1647
 
            source_tree.branch.repository, tip)
1648
 
        stream = source.get_stream(search)
1649
 
        from_format = source_tree.branch.repository._format
1650
 
        sink = target._get_sink()
1651
 
        sink.insert_stream(stream, from_format, [])
1652
 
        if expect_pack_called:
1653
 
            self.assertLength(1, self.calls)
1654
 
        else:
1655
 
            self.assertLength(0, self.calls)
1656
 
 
1657
 
    def run_fetch(self, src_fmt, target_fmt, expect_pack_called):
1658
 
        self.expect_hint = expect_pack_called
1659
 
        self.calls = []
1660
 
        source_tree = self.make_branch_and_tree('src', format=src_fmt)
1661
 
        source_tree.lock_write()
1662
 
        self.addCleanup(source_tree.unlock)
1663
 
        tip = source_tree.commit('foo')
1664
 
        target = self.make_repository('target', format=target_fmt)
1665
 
        target.lock_write()
1666
 
        self.addCleanup(target.unlock)
1667
 
        source = source_tree.branch.repository
1668
 
        self.orig_pack = target.pack
1669
 
        target.pack = self.log_pack
1670
 
        target.fetch(source)
1671
 
        if expect_pack_called:
1672
 
            self.assertLength(1, self.calls)
1673
 
        else:
1674
 
            self.assertLength(0, self.calls)
1675
 
 
1676
 
    def test_sink_format_hint_no(self):
1677
 
        # When the target format says packing makes no difference, pack is not
1678
 
        # called.
1679
 
        self.run_stream('1.9', 'rich-root-pack', False)
1680
 
 
1681
 
    def test_sink_format_hint_yes(self):
1682
 
        # When the target format says packing makes a difference, pack is
1683
 
        # called.
1684
 
        self.run_stream('1.9', '2a', True)
1685
 
 
1686
 
    def test_sink_format_same_no(self):
1687
 
        # When the formats are the same, pack is not called.
1688
 
        self.run_stream('2a', '2a', False)
1689
 
 
1690
 
    def test_IDS_format_hint_no(self):
1691
 
        # When the target format says packing makes no difference, pack is not
1692
 
        # called.
1693
 
        self.run_fetch('1.9', 'rich-root-pack', False)
1694
 
 
1695
 
    def test_IDS_format_hint_yes(self):
1696
 
        # When the target format says packing makes a difference, pack is
1697
 
        # called.
1698
 
        self.run_fetch('1.9', '2a', True)
1699
 
 
1700
 
    def test_IDS_format_same_no(self):
1701
 
        # When the formats are the same, pack is not called.
1702
 
        self.run_fetch('2a', '2a', False)
 
1435
    # To date, this class has been factored out and nothing new added to it;
 
1436
    # thus there are not yet any tests.
 
1437
 
 
1438
 
 
1439
class TestInterDifferingSerializer(TestCaseWithTransport):
 
1440
 
 
1441
    def test_progress_bar(self):
 
1442
        tree = self.make_branch_and_tree('tree')
 
1443
        tree.commit('rev1', rev_id='rev-1')
 
1444
        tree.commit('rev2', rev_id='rev-2')
 
1445
        tree.commit('rev3', rev_id='rev-3')
 
1446
        repo = self.make_repository('repo')
 
1447
        inter_repo = repository.InterDifferingSerializer(
 
1448
            tree.branch.repository, repo)
 
1449
        pb = progress.InstrumentedProgress(to_file=StringIO())
 
1450
        pb.never_throttle = True
 
1451
        inter_repo.fetch('rev-1', pb)
 
1452
        self.assertEqual('Transferring revisions', pb.last_msg)
 
1453
        self.assertEqual(1, pb.last_cnt)
 
1454
        self.assertEqual(1, pb.last_total)
 
1455
        inter_repo.fetch('rev-3', pb)
 
1456
        self.assertEqual(2, pb.last_cnt)
 
1457
        self.assertEqual(2, pb.last_total)