    added text, reducing memory and object pressure.
    """

    def __init__(self, repository, parents, config, timestamp=None,
                 timezone=None, committer=None, revprops=None,
                 revision_id=None):
        CommitBuilder.__init__(self, repository, parents, config,
            timestamp=timestamp, timezone=timezone, committer=committer,
            revprops=revprops, revision_id=revision_id)
        self._file_graph = Graph(
            repository._pack_collection.text_index.combined_index)

    def _add_text_to_weave(self, file_id, new_lines, parents, nostore_sha):
        return self.repository._pack_collection._add_text_to_weave(file_id,
            self._new_revision_id, new_lines, parents, nostore_sha,
            self.random_revid)

    def _heads(self, file_id, revision_ids):
        keys = [(file_id, revision_id) for revision_id in revision_ids]
        return set([key[1] for key in self._file_graph.heads(keys)])
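
    # Illustrative sketch (editorial note, not part of the original code):
    # Graph.heads() drops any key that is an ancestor of another candidate,
    # so _heads() collapses redundant per-file parents. With hypothetical
    # ids, assuming rev-1 is an ancestor of rev-2:
    #
    #   builder._heads('file-a', ['rev-1', 'rev-2'])
    #   # -> set(['rev-2'])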


class PackRootCommitBuilder(RootCommitBuilder):
    """A subclass of RootCommitBuilder to add texts with pack semantics.

    Specifically this uses one knit object rather than one knit object per
    added text, reducing memory and object pressure.
    """

    def __init__(self, repository, parents, config, timestamp=None,
                 timezone=None, committer=None, revprops=None,
                 revision_id=None):
        CommitBuilder.__init__(self, repository, parents, config,
            timestamp=timestamp, timezone=timezone, committer=committer,
            revprops=revprops, revision_id=revision_id)
        self._file_graph = Graph(
            repository._pack_collection.text_index.combined_index)

    def _add_text_to_weave(self, file_id, new_lines, parents, nostore_sha):
        return self.repository._pack_collection._add_text_to_weave(file_id,
            self._new_revision_id, new_lines, parents, nostore_sha,
            self.random_revid)

    def _heads(self, file_id, revision_ids):
        keys = [(file_id, revision_id) for revision_id in revision_ids]
        return set([key[1] for key in self._file_graph.heads(keys)])


class Pack(object):
    """An in memory proxy for a pack and its indices.

            self._pack_collection._pack_transport, upload_suffix=self.suffix,
            file_mode=self._pack_collection.repo.control_files._file_mode)

    def _copy_revision_texts(self):
        """Copy revision data to the new pack."""
        # select revisions
        if self.revision_ids:
            revision_keys = [(revision_id,) for revision_id in self.revision_ids]
        else:
            revision_keys = None
        # select revision keys
        revision_index_map = self._pack_collection._packs_list_to_pack_map_and_index_list(
            self.packs, 'revision_index')[0]
        revision_nodes = self._pack_collection._index_contents(revision_index_map, revision_keys)
        # copy revision keys and adjust values
        self.pb.update("Copying revision texts", 1)
        list(self._copy_nodes_graph(revision_nodes, revision_index_map,
            self.new_pack._writer, self.new_pack.revision_index))
        if 'pack' in debug.debug_flags:
            mutter('%s: create_pack: revisions copied: %s%s %d items t+%6.3fs',
                time.ctime(), self._pack_collection._upload_transport.base,
                self.new_pack.random_name,
                self.new_pack.revision_index.key_count(),
                time.time() - self.new_pack.start_time)
        self._revision_keys = revision_keys
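
    # A minimal sketch of the key shapes assumed above (hypothetical ids):
    # revision ids become 1-tuples so they can be looked up in the revision
    # GraphIndex, while None means "copy every revision".
    #
    #   self.revision_ids = ['rev-1', 'rev-2']
    #   revision_keys     = [('rev-1',), ('rev-2',)]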

    def _copy_inventory_texts(self):
        """Copy the inventory texts to the new pack.

        self._revision_keys is used to determine what inventories to copy.

        Sets self._text_filter appropriately.
        """
        # select inventory keys
        inv_keys = self._revision_keys # currently the same keyspace, and note that
        # querying for keys here could introduce a bug where an inventory item
        # is missed, so do not change it to query separately without cross
        # checking like the text key check below.
        inventory_index_map = self._pack_collection._packs_list_to_pack_map_and_index_list(
            self.packs, 'inventory_index')[0]
        inv_nodes = self._pack_collection._index_contents(inventory_index_map, inv_keys)
        # copy inventory keys and adjust values
        self.pb.update("Copying inventory texts", 2)
        inv_lines = self._copy_nodes_graph(inv_nodes, inventory_index_map,
            self.new_pack._writer, self.new_pack.inventory_index, output_lines=True)
        if self.revision_ids:
            self._process_inventory_lines(inv_lines)
        else:
            # eat the iterator to cause it to execute.
            list(inv_lines)
            self._text_filter = None
        if 'pack' in debug.debug_flags:
            mutter('%s: create_pack: inventories copied: %s%s %d items t+%6.3fs',
                time.ctime(), self._pack_collection._upload_transport.base,
                self.new_pack.random_name,
                self.new_pack.inventory_index.key_count(),
                time.time() - self.new_pack.start_time)
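
    # Sketch of the "eat the iterator" idiom above (hypothetical generator):
    # _copy_nodes_graph only writes records as it is iterated, so the copy
    # must be forced even when the line output itself is unused.
    #
    #   def copy():
    #       for record in records:
    #           writer.write(record)   # the side effect we need
    #           yield record.lines
    #   list(copy())                   # drains the generator, forcing writes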

    def _copy_text_texts(self):
        # select text keys
        text_index_map, text_nodes = self._get_text_nodes()
        if self._text_filter is not None:
            # We could return the keys copied as part of the return value from
            # _copy_nodes_graph but this doesn't work all that well with the
            # need to get line output too, so we check separately, and as we're
            # asking for the deserialised data, we might as well examine it.
            text_nodes = set(text_nodes)
            present_text_keys = set(_node[1] for _node in text_nodes)
            missing_text_keys = set(self._text_filter) - present_text_keys
            if missing_text_keys:
                # TODO: raise a specific error that can handle many missing
                # keys.
                a_missing_key = missing_text_keys.pop()
                raise errors.RevisionNotPresent(a_missing_key[1],
                    a_missing_key[0])
        # copy text keys and adjust values
        self.pb.update("Copying content texts", 3)
        list(self._copy_nodes_graph(text_nodes, text_index_map,
            self.new_pack._writer, self.new_pack.text_index))
        self._log_copied_texts()

    def _check_references(self):
        """Make sure our external references are present."""
        external_refs = self.new_pack._external_compression_parents_of_texts()
        if external_refs:
            index = self._pack_collection.text_index.combined_index
            found_items = list(index.iter_entries(external_refs))
            if len(found_items) != len(external_refs):
                found_keys = set(k for idx, k, refs, value in found_items)
                missing_items = external_refs - found_keys
                missing_file_id, missing_revision_id = missing_items.pop()
                raise errors.RevisionNotPresent(missing_revision_id,
                    missing_file_id)
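
    # Illustrative sketch (assumed key shape): external_refs holds
    # (file_id, revision_id) 2-tuples naming compression parents that live
    # outside the new pack; each must resolve in the combined text index.
    #
    #   external_refs = set([('file-a', 'rev-1')])
    #   list(index.iter_entries(external_refs))   # must yield one entry here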

    def _create_pack_from_packs(self):
        self.pb.update("Opening pack", 0, 5)
        self.new_pack = self.open_pack()
        new_pack = self.new_pack
        # buffer data - we won't be reading-back during the pack creation and
        # this makes a significant difference on sftp pushes.
        new_pack.set_write_cache_size(1024*1024)
        if 'pack' in debug.debug_flags:
            plain_pack_list = ['%s%s' % (a_pack.pack_transport.base, a_pack.name)
                for a_pack in self.packs]
            if self.revision_ids is not None:
                rev_count = len(self.revision_ids)
            else:
                rev_count = 'all'
            mutter('%s: create_pack: creating pack from source packs: '
                '%s%s %s revisions wanted %s t=0',
                time.ctime(), self._pack_collection._upload_transport.base, new_pack.random_name,
                plain_pack_list, rev_count)
        self._copy_revision_texts()
        self._copy_inventory_texts()
        self._copy_text_texts()
        # select signature keys
        signature_filter = self._revision_keys # same keyspace
        signature_index_map = self._pack_collection._packs_list_to_pack_map_and_index_list(
            self.packs, 'signature_index')[0]
        signature_nodes = self._pack_collection._index_contents(signature_index_map,
            signature_filter)
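        # Sketch of the assumed index plumbing used throughout this method
        # (hypothetical values): _packs_list_to_pack_map_and_index_list()
        # returns (index-to-pack map, index list) and [0] keeps the map;
        # _index_contents() then yields (index, key, value[, refs]) entries
        # from those indices, restricted to the optional key filter.
        #
        #   index_map = {sig_index_1: pack_1, sig_index_2: pack_2}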

                pb.update("Copied record", record_index)
                record_index += 1

    def _get_text_nodes(self):
        text_index_map = self._pack_collection._packs_list_to_pack_map_and_index_list(
            self.packs, 'text_index')[0]
        return text_index_map, self._pack_collection._index_contents(text_index_map,
            self._text_filter)

    def _log_copied_texts(self):
        if 'pack' in debug.debug_flags:
            mutter('%s: create_pack: file texts copied: %s%s %d items t+%6.3fs',
                time.ctime(), self._pack_collection._upload_transport.base,
                self.new_pack.random_name,
                self.new_pack.text_index.key_count(),
                time.time() - self.new_pack.start_time)

    def _process_inventory_lines(self, inv_lines):
        """Use up the inv_lines generator and set up a text key filter."""
        repo = self._pack_collection.repo
        fileid_revisions = repo._find_file_ids_from_xml_inventory_lines(
            inv_lines, self.revision_ids)
        text_filter = []
        for fileid, file_revids in fileid_revisions.iteritems():
            text_filter.extend([(fileid, file_revid) for file_revid in file_revids])
        self._text_filter = text_filter
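
    # A minimal sketch of the filter being built (hypothetical values):
    # the text keys that a fetch limited to self.revision_ids must copy.
    #
    #   fileid_revisions  = {'file-a': ['rev-1', 'rev-2']}
    #   self._text_filter = [('file-a', 'rev-1'), ('file-a', 'rev-2')]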

    def _use_pack(self, new_pack):
        """Return True if new_pack should be used.

        :param new_pack: The pack that has just been created.
        :return: True if the pack should be used.
        """
        return new_pack.data_inserted()


class ReconcilePacker(Packer):
    """A packer which regenerates indices etc as it copies.

    This is used by ``bzr reconcile`` to cause parent text pointers to be
    regenerated.
    """

    def _extra_init(self):
        self._data_changed = False

    def _process_inventory_lines(self, inv_lines):
        """Generate a text key reference map for reconciling with."""
        repo = self._pack_collection.repo
        refs = repo._find_text_key_references_from_xml_inventory_lines(
            inv_lines)
        self._text_refs = refs
        # during reconcile we:
        #  - convert unreferenced texts to full texts
        #  - correct texts which reference a text not copied to be full texts
        #  - copy all others as-is but with corrected parents.
        #  - so at this point we don't know enough to decide what becomes a full
        #    text.
        self._text_filter = None

    def _copy_text_texts(self):
        """Generate what texts we should have and then copy."""
        self.pb.update("Copying content texts", 3)
        # we have three major tasks here:
        # 1) generate the ideal index
        repo = self._pack_collection.repo
        ancestors = dict([(key[0], tuple(ref[0] for ref in refs[0])) for
            _1, key, _2, refs in
            self.new_pack.revision_index.iter_all_entries()])
        ideal_index = repo._generate_text_key_index(self._text_refs, ancestors)
        # 2) generate a text_nodes list that contains all the deltas that can
        #    be used as-is, with corrected parents.
        ok_nodes = []
        bad_texts = []
        discarded_nodes = []
        NULL_REVISION = _mod_revision.NULL_REVISION
        text_index_map, text_nodes = self._get_text_nodes()
        for node in text_nodes:
            # each node is (index, key, value, refs)
            try:
                ideal_parents = tuple(ideal_index[node[1]])
            except KeyError:
                discarded_nodes.append(node)
                self._data_changed = True
            else:
                if ideal_parents == (NULL_REVISION,):
                    ideal_parents = ()
                if ideal_parents == node[3][0]:
                    # no change needed.
                    ok_nodes.append(node)
                elif ideal_parents[0:1] == node[3][0][0:1]:
                    # the left most parent is the same, or there are no parents
                    # today. Either way, we can preserve the representation as
                    # long as we change the refs to be inserted.
                    ok_nodes.append((node[0], node[1], node[2],
                        (ideal_parents, node[3][1])))
                    self._data_changed = True
                else:
                    # Reinsert this text completely
                    bad_texts.append((node[1], ideal_parents))
                    self._data_changed = True
        # we're finished with some data.
        del ideal_index
        del text_nodes
        # 3) bulk copy the ok data
        list(self._copy_nodes_graph(ok_nodes, text_index_map,
            self.new_pack._writer, self.new_pack.text_index))
        # 4) ad hoc copy all the other texts.
        # We have to topologically insert all texts otherwise we can fail to
        # reconcile when parts of a single delta chain are preserved intact,
        # and other parts are not. E.g. Discarded->d1->d2->d3. d1 will be
        # reinserted, and if d3 has incorrect parents it will also be
        # reinserted. If we insert d3 first, d2 is present (as it was bulk
        # copied), so we will try to delta, but d2 is not currently able to be
        # extracted because its basis d1 is not present. Topologically sorting
        # addresses this. The following generates a sort for all the texts that
        # are being inserted without having to reference the entire text key
        # space (we only topo sort the revisions, which is smaller).
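        # Sketch of the ordering this produces (hypothetical graph):
        # tsort.topo_sort({'d1': (), 'd2': ('d1',), 'd3': ('d2',)}) returns
        # ['d1', 'd2', 'd3'], so bad_texts is reinserted parents-first.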
        topo_order = tsort.topo_sort(ancestors)
        rev_order = dict(zip(topo_order, range(len(topo_order))))
        bad_texts.sort(key=lambda key: rev_order[key[0][1]])
        transaction = repo.get_transaction()
        file_id_index = GraphIndexPrefixAdapter(
            self.new_pack.text_index,
            ('blank', ), 1,
            add_nodes_callback=self.new_pack.text_index.add_nodes)
        knit_index = KnitGraphIndex(file_id_index,
            add_callback=file_id_index.add_nodes,
            deltas=True, parents=True)
        output_knit = knit.KnitVersionedFile('reconcile-texts',
            self._pack_collection.transport,
            None,
            index=knit_index,
            access_method=_PackAccess(
                {self.new_pack.text_index:self.new_pack.access_tuple()},
                (self.new_pack._writer, self.new_pack.text_index)),
            factory=knit.KnitPlainFactory())
        for key, parent_keys in bad_texts:
            # We refer back to the new pack for delta bases while writing
            # output. A possible improvement would be to catch errors on
            # short reads and only flush then.
            self.new_pack.flush()
            parents = []
            for parent_key in parent_keys:
                if parent_key[0] != key[0]:
                    # Graph parents must match the fileid
                    raise errors.BzrError('Mismatched key parent %r:%r' %
                        (key, parent_keys))
                parents.append(parent_key[1])
            source_weave = repo.weave_store.get_weave(key[0], transaction)
            text_lines = source_weave.get_lines(key[1])
            # adapt the 'knit' to the current file_id.
            file_id_index = GraphIndexPrefixAdapter(
                self.new_pack.text_index,
                (key[0], ), 1,
                add_nodes_callback=self.new_pack.text_index.add_nodes)
            knit_index._graph_index = file_id_index
            knit_index._add_callback = file_id_index.add_nodes
            output_knit.add_lines_with_ghosts(
                key[1], parents, text_lines, random_id=True, check_content=False)
        # 5) check that nothing inserted has a reference outside the keyspace.
        missing_text_keys = self.new_pack._external_compression_parents_of_texts()
        if missing_text_keys:
            raise errors.BzrError('Reference to missing compression parents %r'
                % (missing_text_keys,))
        self._log_copied_texts()

    def _use_pack(self, new_pack):
        """Override _use_pack to check for reconcile having changed content."""
        # XXX: we might be better off checking this at copy time.
        original_inventory_keys = set()
        inv_index = self._pack_collection.inventory_index.combined_index
        for entry in inv_index.iter_all_entries():
            original_inventory_keys.add(entry[1])
        new_inventory_keys = set()
        for entry in new_pack.inventory_index.iter_all_entries():
            new_inventory_keys.add(entry[1])
        if new_inventory_keys != original_inventory_keys:
            self._data_changed = True
        return new_pack.data_inserted() and self._data_changed


class RepositoryPackCollection(object):
    """Management of packs within a repository."""