/brz/remove-bazaar : revision 4385.4.2

To get this branch, use:

bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/repofmt/groupcompress_repo.py

Committer: John Arbash Meinel
Date: 2009-07-08 14:37:25 UTC
mfrom: (4516 +trunk)
mto: This revision was merged to the branch mainline in revision 4517.
Revision ID: john@arbash-meinel.com-20090708143725-sc9sjy3mz4cxwxzz

Merge bzr.dev 4516

files added:
bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/benchmarks/bench_tags.py

bzrlib/bencode.py

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/send.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_chk_serializer.py

bzrlib/util/bencode.py

doc/developers/bug-handling.txt

doc/index.ru.txt

doc/ru

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/Makefile

doc/ru/quick-reference/quick-start-summary.pdf

doc/ru/quick-reference/quick-start-summary.png

doc/ru/quick-reference/quick-start-summary.svg

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

tools/time_graph.py

files removed:
bzrlib/util/tests/test_bencode.py

doc/developers/performance-contributing.txt

files renamed:
bzrlib/_btree_serializer_c.pyx => bzrlib/_btree_serializer_pyx.pyx

bzrlib/_dirstate_helpers_c.h => bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_c.pyx => bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_knit_load_data_c.pyx => bzrlib/_knit_load_data_pyx.pyx

tools/doc_generate/ => bzrlib/doc_generate/

bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py => bzrlib/tests/tree_implementations/test_get_file_with_stat.py

bzrlib/util/bencode.py => bzrlib/util/_bencode_py.py

generate_docs.py => tools/generate_docs.py

files modified:
.bzrignore

Makefile

NEWS

bzrlib/__init__.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/branch.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/errors.py

bzrlib/fetch.py

bzrlib/filters/__init__.py

bzrlib/foreign.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/eol.txt

bzrlib/hooks.py

bzrlib/index.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mail_client.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/remote.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisiontree.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/smart/bzrdir.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/switch.py

bzrlib/tag.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_dotted_revno_to_revision_id.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/bzrdir_implementations/test_push.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_http.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_content_filters.py

bzrlib/tests/workingtree_implementations/test_eol_conversion.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/sftp.py

bzrlib/transport/trace.py

bzrlib/tree.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

doc/developers/cycle.txt

doc/developers/index.txt

doc/developers/inventory.txt

doc/developers/performance-roadmap.txt

doc/developers/planned-change-integration.txt

doc/developers/releasing.txt

doc/en/developer-guide/HACKING.txt

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.png

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/introducing_bazaar.txt

doc/index.txt

setup.py

tools/win32/build_release.py

Show diffs side-by-side

added added

removed removed

bzrlib/repofmt/groupcompress_repo.py

osutils,

pack,

remote,

repository,

revision as _mod_revision,

trace,

ui,

BTreeGraphIndex,

BTreeBuilder,

)

from bzrlib.index import GraphIndex, GraphIndexBuilder

from bzrlib.groupcompress import (

_GCGraphIndex,

GroupCompressVersionedFiles,

Pack,

NewPack,

KnitPackRepository,

KnitPackStreamSource,

PackRootCommitBuilder,

RepositoryPackCollection,

RepositoryFormatPack,

ResumedPack,

Packer,

)

163

have deltas based on a fallback repository.

164

(See <https://bugs.launchpad.net/bzr/+bug/288751>)

165

"""

166

# Groupcompress packs don't have any external references

166

# Groupcompress packs don't have any external references, arguably CHK

167

# pages have external references, but we cannot 'cheaply' determine

168

# them without actually walking all of the chk pages.

169

170

171

class ResumedGCPack(ResumedPack):

172

173

def _check_references(self):

174

"""Make sure our external compression parents are present."""

175

# See GCPack._check_references for why this is empty

176

177

def _get_external_refs(self, index):

178

# GC repositories don't have compression parents external to a given

179

# pack file

180

return set()

167

181

168

182

169

183

class GCCHKPacker(Packer):

202

216

p_id_roots_set = set()

203

217

stream = source_vf.get_record_stream(keys, 'groupcompress', True)

204

218

for idx, record in enumerate(stream):

219

# Inventories should always be with revisions; assume success.

205

220

bytes = record.get_bytes_as('fulltext')

206

221

chk_inv = inventory.CHKInventory.deserialise(None, bytes,

207

222

record.key)

278

293

stream = source_vf.get_record_stream(cur_keys,

279

294

'as-requested', True)

280

295

for record in stream:

296

if record.storage_kind == 'absent':

297

# An absent CHK record: we assume that the missing

298

# record is in a different pack - e.g. a page not

299

# altered by the commit we're packing.

300

continue

281

301

bytes = record.get_bytes_as('fulltext')

282

302

# We don't care about search_key_func for this code,

283

303

# because we only care about external references.

540

560

class GCRepositoryPackCollection(RepositoryPackCollection):

541

561

542

562

pack_factory = GCPack

543

544

def _already_packed(self):

545

"""Is the collection already packed?"""

546

# Always repack GC repositories for now

547

return False

563

resumed_pack_factory = ResumedGCPack

548

564

549

565

def _execute_pack_operations(self, pack_operations,

550

566

_packer_class=GCCHKPacker,

604

620

self.inventories = GroupCompressVersionedFiles(

605

621

_GCGraphIndex(self._pack_collection.inventory_index.combined_index,

606

622

add_callback=self._pack_collection.inventory_index.add_callback,

607

parents=True, is_locked=self.is_locked),

623

parents=True, is_locked=self.is_locked,

624

inconsistency_fatal=False),

608

625

access=self._pack_collection.inventory_index.data_access)

609

626

self.revisions = GroupCompressVersionedFiles(

610

627

_GCGraphIndex(self._pack_collection.revision_index.combined_index,

611

628

add_callback=self._pack_collection.revision_index.add_callback,

612

parents=True, is_locked=self.is_locked),

629

parents=True, is_locked=self.is_locked,

630

track_external_parent_refs=True),

613

631

access=self._pack_collection.revision_index.data_access,

614

632

delta=False)

615

633

self.signatures = GroupCompressVersionedFiles(

616

634

_GCGraphIndex(self._pack_collection.signature_index.combined_index,

617

635

add_callback=self._pack_collection.signature_index.add_callback,

618

parents=False, is_locked=self.is_locked),

636

parents=False, is_locked=self.is_locked,

637

inconsistency_fatal=False),

619

638

access=self._pack_collection.signature_index.data_access,

620

639

delta=False)

621

640

self.texts = GroupCompressVersionedFiles(

622

641

_GCGraphIndex(self._pack_collection.text_index.combined_index,

623

642

add_callback=self._pack_collection.text_index.add_callback,

624

parents=True, is_locked=self.is_locked),

643

parents=True, is_locked=self.is_locked,

644

inconsistency_fatal=False),

625

645

access=self._pack_collection.text_index.data_access)

626

646

# No parents, individual CHK pages don't have specific ancestry

627

647

self.chk_bytes = GroupCompressVersionedFiles(

628

648

_GCGraphIndex(self._pack_collection.chk_index.combined_index,

629

649

add_callback=self._pack_collection.chk_index.add_callback,

630

parents=False, is_locked=self.is_locked),

650

parents=False, is_locked=self.is_locked,

651

inconsistency_fatal=False),

631

652

access=self._pack_collection.chk_index.data_access)

632

653

# True when the repository object is 'write locked' (as opposed to the

633

654

# physical lock only taken out around changes to the pack-names list.)

657

678

return self._inventory_add_lines(revision_id, parents,

658

679

inv_lines, check_content=False)

659

680

681

def _create_inv_from_null(self, delta, revision_id):

682

"""This will mutate new_inv directly.

683

684

This is a simplified form of create_by_apply_delta which knows that all

685

the old values must be None, so everything is a create.

686

"""

687

serializer = self._format._serializer

688

new_inv = inventory.CHKInventory(serializer.search_key_name)

689

new_inv.revision_id = revision_id

690

entry_to_bytes = new_inv._entry_to_bytes

691

id_to_entry_dict = {}

692

parent_id_basename_dict = {}

693

for old_path, new_path, file_id, entry in delta:

694

if old_path is not None:

695

raise ValueError('Invalid delta, somebody tried to delete %r'

696

' from the NULL_REVISION'

697

% ((old_path, file_id),))

698

if new_path is None:

699

raise ValueError('Invalid delta, delta from NULL_REVISION has'

700

' no new_path %r' % (file_id,))

701

if new_path == '':

702

new_inv.root_id = file_id

703

parent_id_basename_key = ('', '')

704

else:

705

utf8_entry_name = entry.name.encode('utf-8')

706

parent_id_basename_key = (entry.parent_id, utf8_entry_name)

707

new_value = entry_to_bytes(entry)

708

# Populate Caches?

709

# new_inv._path_to_fileid_cache[new_path] = file_id

710

id_to_entry_dict[(file_id,)] = new_value

711

parent_id_basename_dict[parent_id_basename_key] = file_id

712

713

new_inv._populate_from_dicts(self.chk_bytes, id_to_entry_dict,

714

parent_id_basename_dict, maximum_size=serializer.maximum_size)

715

return new_inv

716

660

717

def add_inventory_by_delta(self, basis_revision_id, delta, new_revision_id,

661

718

parents, basis_inv=None, propagate_caches=False):

662

719

"""Add a new inventory expressed as a delta against another revision.

682

739

repository format specific) of the serialized inventory, and the

683

740

resulting inventory.

684

741

"""

685

if basis_revision_id == _mod_revision.NULL_REVISION:

686

return KnitPackRepository.add_inventory_by_delta(self,

687

basis_revision_id, delta, new_revision_id, parents)

688

742

if not self.is_in_write_group():

689

743

raise AssertionError("%r not in write group" % (self,))

690

744

_mod_revision.check_not_reserved_id(new_revision_id)

691

basis_tree = self.revision_tree(basis_revision_id)

692

basis_tree.lock_read()

693

try:

694

if basis_inv is None:

745

basis_tree = None

746

if basis_inv is None:

747

if basis_revision_id == _mod_revision.NULL_REVISION:

748

new_inv = self._create_inv_from_null(delta, new_revision_id)

749

inv_lines = new_inv.to_lines()

750

return self._inventory_add_lines(new_revision_id, parents,

751

inv_lines, check_content=False), new_inv

752

else:

753

basis_tree = self.revision_tree(basis_revision_id)

754

basis_tree.lock_read()

695

755

basis_inv = basis_tree.inventory

756

try:

696

757

result = basis_inv.create_by_apply_delta(delta, new_revision_id,

697

758

propagate_caches=propagate_caches)

698

759

inv_lines = result.to_lines()

699

760

return self._inventory_add_lines(new_revision_id, parents,

700

761

inv_lines, check_content=False), result

701

762

finally:

702

basis_tree.unlock()

763

if basis_tree is not None:

764

basis_tree.unlock()

703

765

704

766

def _iter_inventories(self, revision_ids):

705

767

"""Iterate over many inventory objects."""

719

781

# make it raise to trap naughty direct users.

720

782

raise NotImplementedError(self._iter_inventory_xmls)

721

783

722

def _find_revision_outside_set(self, revision_ids):

723

revision_set = frozenset(revision_ids)

724

for revid in revision_ids:

725

parent_ids = self.get_parent_map([revid]).get(revid, ())

726

for parent in parent_ids:

727

if parent in revision_set:

728

# Parent is not outside the set

729

continue

730

if parent not in self.get_parent_map([parent]):

731

# Parent is a ghost

732

continue

733

return parent

734

return _mod_revision.NULL_REVISION

735

736

def _find_file_keys_to_fetch(self, revision_ids, pb):

737

rich_root = self.supports_rich_root()

738

revision_outside_set = self._find_revision_outside_set(revision_ids)

739

if revision_outside_set == _mod_revision.NULL_REVISION:

740

uninteresting_root_keys = set()

741

else:

742

uninteresting_inv = self.get_inventory(revision_outside_set)

743

uninteresting_root_keys = set([uninteresting_inv.id_to_entry.key()])

744

interesting_root_keys = set()

745

for idx, inv in enumerate(self.iter_inventories(revision_ids)):

746

interesting_root_keys.add(inv.id_to_entry.key())

747

revision_ids = frozenset(revision_ids)

748

file_id_revisions = {}

749

bytes_to_info = inventory.CHKInventory._bytes_to_utf8name_key

750

for record, items in chk_map.iter_interesting_nodes(self.chk_bytes,

751

interesting_root_keys, uninteresting_root_keys,

752

pb=pb):

753

# This is cheating a bit to use the last grabbed 'inv', but it

754

# works

755

for name, bytes in items:

756

(name_utf8, file_id, revision_id) = bytes_to_info(bytes)

757

if not rich_root and name_utf8 == '':

758

continue

759

if revision_id in revision_ids:

760

# Would we rather build this up into file_id => revision

761

# maps?

762

try:

763

file_id_revisions[file_id].add(revision_id)

764

except KeyError:

765

file_id_revisions[file_id] = set([revision_id])

766

for file_id, revisions in file_id_revisions.iteritems():

767

yield ('file', file_id, revisions)

784

def _find_present_inventory_keys(self, revision_keys):

785

parent_map = self.inventories.get_parent_map(revision_keys)

786

present_inventory_keys = set(k for k in parent_map)

787

return present_inventory_keys

768

788

769

789

def fileids_altered_by_revision_ids(self, revision_ids, _inv_weave=None):

770

790

"""Find the file ids and versions affected by revisions.

776

796

revision_ids. Each altered file-ids has the exact revision_ids that

777

797

altered it listed explicitly.

778

798

"""

779

rich_roots = self.supports_rich_root()

780

result = {}

799

rich_root = self.supports_rich_root()

800

bytes_to_info = inventory.CHKInventory._bytes_to_utf8name_key

801

file_id_revisions = {}

781

802

pb = ui.ui_factory.nested_progress_bar()

782

803

try:

783

total = len(revision_ids)

784

for pos, inv in enumerate(self.iter_inventories(revision_ids)):

785

pb.update("Finding text references", pos, total)

786

for entry in inv.iter_just_entries():

787

if entry.revision != inv.revision_id:

788

continue

789

if not rich_roots and entry.file_id == inv.root_id:

790

continue

791

alterations = result.setdefault(entry.file_id, set([]))

792

alterations.add(entry.revision)

793

return result

804

revision_keys = [(r,) for r in revision_ids]

805

parent_keys = self._find_parent_keys_of_revisions(revision_keys)

806

# TODO: instead of using _find_present_inventory_keys, change the

807

# code paths to allow missing inventories to be tolerated.

808

# However, we only want to tolerate missing parent

809

# inventories, not missing inventories for revision_ids

810

present_parent_inv_keys = self._find_present_inventory_keys(

811

parent_keys)

812

present_parent_inv_ids = set(

813

[k[-1] for k in present_parent_inv_keys])

814

uninteresting_root_keys = set()

815

interesting_root_keys = set()

816

inventories_to_read = set(revision_ids)

817

inventories_to_read.update(present_parent_inv_ids)

818

for inv in self.iter_inventories(inventories_to_read):

819

entry_chk_root_key = inv.id_to_entry.key()

820

if inv.revision_id in present_parent_inv_ids:

821

uninteresting_root_keys.add(entry_chk_root_key)

822

else:

823

interesting_root_keys.add(entry_chk_root_key)

824

825

chk_bytes = self.chk_bytes

826

for record, items in chk_map.iter_interesting_nodes(chk_bytes,

827

interesting_root_keys, uninteresting_root_keys,

828

pb=pb):

829

for name, bytes in items:

830

(name_utf8, file_id, revision_id) = bytes_to_info(bytes)

831

if not rich_root and name_utf8 == '':

832

continue

833

try:

834

file_id_revisions[file_id].add(revision_id)

835

except KeyError:

836

file_id_revisions[file_id] = set([revision_id])

794

837

finally:

795

838

pb.finished()

839

return file_id_revisions

796

840

797

841

def find_text_key_references(self):

798

842

"""Find the text key references within the repository.

843

887

return GroupCHKStreamSource(self, to_format)

844

888

return super(CHKInventoryRepository, self)._get_source(to_format)

845

889

846

def suspend_write_group(self):

847

raise errors.UnsuspendableWriteGroup(self)

848

849

def _resume_write_group(self, tokens):

850

raise errors.UnsuspendableWriteGroup(self)

851

852

853

class GroupCHKStreamSource(repository.StreamSource):

890

891

class GroupCHKStreamSource(KnitPackStreamSource):

854

892

"""Used when both the source and target repo are GroupCHK repos."""

855

893

856

894

def __init__(self, from_repository, to_format):

858

896

super(GroupCHKStreamSource, self).__init__(from_repository, to_format)

859

897

self._revision_keys = None

860

898

self._text_keys = None

899

self._text_fetch_order = 'groupcompress'

861

900

self._chk_id_roots = None

862

901

self._chk_p_id_roots = None

863

902

864

def _get_filtered_inv_stream(self):

903

def _get_inventory_stream(self, inventory_keys, allow_absent=False):

865

904

"""Get a stream of inventory texts.

866

905

867

906

When this function returns, self._chk_id_roots and self._chk_p_id_roots

873

912

id_roots_set = set()

874

913

p_id_roots_set = set()

875

914

source_vf = self.from_repository.inventories

876

stream = source_vf.get_record_stream(self._revision_keys,

915

stream = source_vf.get_record_stream(inventory_keys,

877

916

'groupcompress', True)

878

917

for record in stream:

918

if record.storage_kind == 'absent':

919

if allow_absent:

920

continue

921

else:

922

raise errors.NoSuchRevision(self, record.key)

879

923

bytes = record.get_bytes_as('fulltext')

880

924

chk_inv = inventory.CHKInventory.deserialise(None, bytes,

881

925

record.key)

897

941

p_id_roots_set.clear()

898

942

return ('inventories', _filtered_inv_stream())

899

943

900

def _get_filtered_chk_streams(self, excluded_keys):

944

def _get_filtered_chk_streams(self, excluded_revision_keys):

901

945

self._text_keys = set()

902

excluded_keys.discard(_mod_revision.NULL_REVISION)

903

if not excluded_keys:

946

excluded_revision_keys.discard(_mod_revision.NULL_REVISION)

947

if not excluded_revision_keys:

904

948

uninteresting_root_keys = set()

905

949

uninteresting_pid_root_keys = set()

906

950

else:

951

# filter out any excluded revisions whose inventories are not

952

# actually present

953

# TODO: Update Repository.iter_inventories() to add

954

# ignore_missing=True

955

present_keys = self.from_repository._find_present_inventory_keys(

956

excluded_revision_keys)

957

present_ids = [k[-1] for k in present_keys]

907

958

uninteresting_root_keys = set()

908

959

uninteresting_pid_root_keys = set()

909

for inv in self.from_repository.iter_inventories(excluded_keys):

960

for inv in self.from_repository.iter_inventories(present_ids):

910

961

uninteresting_root_keys.add(inv.id_to_entry.key())

911

962

uninteresting_pid_root_keys.add(

912

963

inv.parent_id_basename_to_file_id.key())

922

973

self._text_keys.add((file_id, revision_id))

923

974

if record is not None:

924

975

yield record

976

# Consumed

977

self._chk_id_roots = None

925

978

yield 'chk_bytes', _filter_id_to_entry()

926

979

def _get_parent_id_basename_to_file_id_pages():

927

980

for record, items in chk_map.iter_interesting_nodes(chk_bytes,

928

981

self._chk_p_id_roots, uninteresting_pid_root_keys):

929

982

if record is not None:

930

983

yield record

984

# Consumed

985

self._chk_p_id_roots = None

931

986

yield 'chk_bytes', _get_parent_id_basename_to_file_id_pages()

932

987

933

def _get_text_stream(self):

934

# Note: We know we don't have to handle adding root keys, because both

935

# the source and target are GCCHK, and those always support rich-roots

936

# We may want to request as 'unordered', in case the source has done a

937

# 'split' packing

938

return ('texts', self.from_repository.texts.get_record_stream(

939

self._text_keys, 'groupcompress', False))

940

941

988

def get_stream(self, search):

942

989

revision_ids = search.get_keys()

943

990

for stream_info in self._fetch_revision_texts(revision_ids):

944

991

yield stream_info

945

992

self._revision_keys = [(rev_id,) for rev_id in revision_ids]

946

yield self._get_filtered_inv_stream()

947

# The keys to exclude are part of the search recipe

948

_, _, exclude_keys, _ = search.get_recipe()

949

for stream_info in self._get_filtered_chk_streams(exclude_keys):

993

yield self._get_inventory_stream(self._revision_keys)

994

# TODO: The keys to exclude might be part of the search recipe

995

# For now, exclude all parents that are at the edge of ancestry, for

996

# which we have inventories

997

from_repo = self.from_repository

998

parent_keys = from_repo._find_parent_keys_of_revisions(

999

self._revision_keys)

1000

for stream_info in self._get_filtered_chk_streams(parent_keys):

950

1001

yield stream_info

951

1002

yield self._get_text_stream()

952

1003

1004

def get_stream_for_missing_keys(self, missing_keys):

1005

# missing keys can only occur when we are byte copying and not

1006

# translating (because translation means we don't send

1007

# unreconstructable deltas ever).

1008

missing_inventory_keys = set()

1009

for key in missing_keys:

1010

if key[0] != 'inventories':

1011

raise AssertionError('The only missing keys we should'

1012

' be filling in are inventory keys, not %s'

1013

% (key[0],))

1014

missing_inventory_keys.add(key[1:])

1015

if self._chk_id_roots or self._chk_p_id_roots:

1016

raise AssertionError('Cannot call get_stream_for_missing_keys'

1017

' untill all of get_stream() has been consumed.')

1018

# Yield the inventory stream, so we can find the chk stream

1019

# Some of the missing_keys will be missing because they are ghosts.

1020

# As such, we can ignore them. The Sink is required to verify there are

1021

# no unavailable texts when the ghost inventories are not filled in.

1022

yield self._get_inventory_stream(missing_inventory_keys,

1023

allow_absent=True)

1024

# We use the empty set for excluded_revision_keys, to make it clear

1025

# that we want to transmit all referenced chk pages.

1026

for stream_info in self._get_filtered_chk_streams(set()):

1027

yield stream_info

1028

953

1029

954

1030

class RepositoryFormatCHK1(RepositoryFormatPack):

955

1031

"""A hashed CHK+group compress pack repository."""

956

1032

957

1033

repository_class = CHKInventoryRepository

1034

supports_external_lookups = True

958

1035

supports_chks = True

959

1036

# For right now, setting this to True gives us InterModel1And2 rather

960

1037

# than InterDifferingSerializer

974

1051

_fetch_order = 'unordered'

975

1052

_fetch_uses_deltas = False # essentially ignored by the groupcompress code.

976

1053

fast_deltas = True

1054

pack_compresses = True

977

1055

978

1056

def _get_matching_bzrdir(self):

979

1057

return bzrdir.format_registry.make_bzrdir('development6-rich-root')

997

1075

if not target_format.rich_root_data:

998

1076

raise errors.BadConversionTarget(

999

1077

'Does not support rich root data.', target_format)

1000

if not getattr(target_format, 'supports_tree_reference', False):

1078

if (self.supports_tree_reference and

1079

not getattr(target_format, 'supports_tree_reference', False)):

1001

1080

raise errors.BadConversionTarget(

1002

1081

'Does not support nested trees', target_format)

1003

1082

1004

1083

1084

1085

class RepositoryFormatCHK2(RepositoryFormatCHK1):

1086

"""A CHK repository that uses the bencode revision serializer."""

1087

1088

_serializer = chk_serializer.chk_bencode_serializer

1089

1090

def _get_matching_bzrdir(self):

1091

return bzrdir.format_registry.make_bzrdir('development7-rich-root')

1092

1093

def _ignore_setting_bzrdir(self, format):

1094

pass

1095

1096

_matchingbzrdir = property(_get_matching_bzrdir, _ignore_setting_bzrdir)

1097

1098

def get_format_string(self):

1099

"""See RepositoryFormat.get_format_string()."""

1100

return ('Bazaar development format - chk repository with bencode '

1101

'revision serialization (needs bzr.dev from 1.16)\n')

1102

1103

1104

class RepositoryFormat2a(RepositoryFormatCHK2):

1105

"""A CHK repository that uses the bencode revision serializer.

1106

1107

This is the same as RepositoryFormatCHK2 but with a public name.

1108

"""

1109

1110

_serializer = chk_serializer.chk_bencode_serializer

1111

1112

def _get_matching_bzrdir(self):

1113

return bzrdir.format_registry.make_bzrdir('2a')

1114

1115

def _ignore_setting_bzrdir(self, format):

1116

pass

1117

1118

_matchingbzrdir = property(_get_matching_bzrdir, _ignore_setting_bzrdir)

1119

1120

def get_format_string(self):

1121

return ('Bazaar repository format 2a (needs bzr 1.16 or later)\n')

Older »