/brz/remove-bazaar : revision 3006.3.5

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/repository.py

Committer: Robert Collins
Date: 2008-02-13 03:30:01 UTC
mfrom: (3221 +trunk)
mto: This revision was merged to the branch mainline in revision 3224.
Revision ID: robertc@robertcollins.net-20080213033001-rw70ul0zb02ph856

Merge to fix conflicts.

files added:
bzrlib/help_topics

bzrlib/help_topics/en

bzrlib/switch.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/repository_implementations/test__generate_text_key_index.py

bzrlib/tests/repository_implementations/test_find_text_key_references.py

bzrlib/tests/repository_implementations/test_has_revisions.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_switch.py

bzrlib/version_info_formats/format_custom.py

contrib/bzr_access

doc/developers/inventory.txt

doc/developers/lca-merge.txt

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/tutorials

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/best_practice_intro.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/revnos.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-reference/readme.txt

index.txt

files removed:
bzrlib/plugins/multiparent.py

doc/en/user-reference/index.txt

files renamed:
bzrlib/help_topics.py => bzrlib/help_topics/__init__.py

doc/en/user-guide/authentication_conf.txt => bzrlib/help_topics/en/authentication.txt

doc/en/user-guide/configuration.txt => bzrlib/help_topics/en/configuration.txt

doc/en/user-guide/conflicts.txt => bzrlib/help_topics/en/conflicts.txt

doc/en/user-reference/hooks.txt => bzrlib/help_topics/en/hooks.txt

bzrlib/tests/HttpServer.py => bzrlib/tests/http_server.py

bzrlib/tests/HTTPTestUtil.py => bzrlib/tests/http_utils.py

doc/developers/knitpack.txt => doc/developers/packrepo.txt

doc/en/user-guide/centralized_workflow.txt => doc/en/tutorials/centralized_workflow.txt

doc/en/user-guide/tutorial.txt => doc/en/tutorials/tutorial.txt

files modified:
.bzrignore

Makefile

NEWS

README

bzrlib/__init__.py

bzrlib/_patiencediff_c.c

bzrlib/annotate.py

bzrlib/branch.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/debug.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc/api/__init__.py

bzrlib/errors.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/index.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/mail_client.py

bzrlib/merge.py

bzrlib/merge_directive.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/remote.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/sign_my_commits.py

bzrlib/smart/branch.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/vfs.py

bzrlib/status.py

bzrlib/symbol_versioning.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/ftp_server.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_info.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/remote.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/version_info_formats/__init__.py

bzrlib/versionedfile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml_serializer.py

doc/developers/HACKING.txt

doc/developers/bundles.txt

doc/developers/index.txt

doc/developers/performance-contributing.txt

doc/en/mini-tutorial/index.txt

doc/en/quick-reference/quick-start-summary.svg

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/index.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/version_info.txt

doc/index.txt

setup.py

tools/doc_generate/autodoc_rstx.py

tools/rst2html.py

tools/win32/bzr.iss.cog

Show diffs side-by-side

added added

removed removed

bzrlib/repository.py

lazy_regex,

lockable_files,

lockdir,

lru_cache,

osutils,

registry,

remote,

revision as _mod_revision,

symbol_versioning,

transactions,

tsort,

ui,

)

from bzrlib.bundle import serializer

# the default CommitBuilder does not manage trees whose root is versioned.

_versioned_root = False

def __init__(self, repository, parents, config, timestamp=None,

timezone=None, committer=None, revprops=None,

def __init__(self, repository, parents, config, timestamp=None,

timezone=None, committer=None, revprops=None,

revision_id=None):

"""Initiate a CommitBuilder.

116

118

self._timezone = int(timezone)

117

119

118

120

self._generate_revision_if_needed()

119

self._heads = graph.HeadsCache(repository.get_graph()).heads

121

self.__heads = graph.HeadsCache(repository.get_graph()).heads

120

122

121

123

def commit(self, message):

122

124

"""Make the actual commit.

188

190

else:

189

191

self.random_revid = False

190

192

193

def _heads(self, file_id, revision_ids):

194

"""Calculate the graph heads for revision_ids in the graph of file_id.

195

196

This can use either a per-file graph or a global revision graph as we

197

have an identity relationship between the two graphs.

198

"""

199

return self.__heads(revision_ids)

200

191

201

def _check_root(self, ie, parent_invs, tree):

192

202

"""Helper for record_entry_contents.

193

203

285

295

# XXX: Friction: parent_candidates should return a list not a dict

286

296

# so that we don't have to walk the inventories again.

287

297

parent_candiate_entries = ie.parent_candidates(parent_invs)

288

head_set = self._heads(parent_candiate_entries.keys())

298

head_set = self._heads(ie.file_id, parent_candiate_entries.keys())

289

299

heads = []

290

300

for inv in parent_invs:

291

301

if ie.file_id in inv:

485

495

attempted.

486

496

"""

487

497

488

@needs_write_lock

489

498

def add_inventory(self, revision_id, inv, parents):

490

499

"""Add the inventory inv to the repository as revision_id.

491

500

492

501

:param parents: The revision ids of the parents that revision_id

493

502

is known to have and are in the repository already.

494

503

495

returns the sha1 of the serialized inventory.

504

:returns: The validator(which is a sha1 digest, though what is sha'd is

505

repository format specific) of the serialized inventory.

496

506

"""

497

507

assert self.is_in_write_group()

498

508

_mod_revision.check_not_reserved_id(revision_id)

515

525

return inv_vf.add_lines(revision_id, final_parents, lines,

516

526

check_content=check_content)[0]

517

527

518

@needs_write_lock

519

528

def add_revision(self, revision_id, rev, inv=None, config=None):

520

529

"""Add rev to the revision store as revision_id.

521

530

756

765

result['size'] = t

757

766

return result

758

767

768

def find_branches(self, using=False):

769

"""Find branches underneath this repository.

770

771

This will include branches inside other branches.

772

773

:param using: If True, list only branches using this repository.

774

"""

775

if using and not self.is_shared():

776

try:

777

return [self.bzrdir.open_branch()]

778

except errors.NotBranchError:

779

return []

780

class Evaluator(object):

781

782

def __init__(self):

783

self.first_call = True

784

785

def __call__(self, bzrdir):

786

# On the first call, the parameter is always the bzrdir

787

# containing the current repo.

788

if not self.first_call:

789

try:

790

repository = bzrdir.open_repository()

791

except errors.NoRepositoryPresent:

792

pass

793

else:

794

return False, (None, repository)

795

self.first_call = False

796

try:

797

value = (bzrdir.open_branch(), None)

798

except errors.NotBranchError:

799

value = (None, None)

800

return True, value

801

802

branches = []

803

for branch, repository in bzrdir.BzrDir.find_bzrdirs(

804

self.bzrdir.root_transport, evaluate=Evaluator()):

805

if branch is not None:

806

branches.append(branch)

807

if not using and repository is not None:

808

branches.extend(repository.find_branches())

809

return branches

810

759

811

def get_data_stream(self, revision_ids):

760

812

raise NotImplementedError(self.get_data_stream)

761

813

814

def get_data_stream_for_search(self, search_result):

815

"""Get a data stream that can be inserted to a repository.

816

817

:param search_result: A bzrlib.graph.SearchResult selecting the

818

revisions to get.

819

:return: A data stream that can be inserted into a repository using

820

insert_data_stream.

821

"""

822

raise NotImplementedError(self.get_data_stream_for_search)

823

762

824

def insert_data_stream(self, stream):

763

825

"""XXX What does this really do?

764

826

779

841

knit = self._revision_store.get_signature_file(

780

842

self.get_transaction())

781

843

else:

782

raise RepositoryDataStreamError(

844

raise errors.RepositoryDataStreamError(

783

845

"Unrecognised data stream key '%s'" % (item_key,))

784

846

decoded_list = bencode.bdecode(bytes)

785

847

format = decoded_list.pop(0)

788

850

for version, options, parents, some_bytes in decoded_list:

789

851

data_list.append((version, options, len(some_bytes), parents))

790

852

knit_bytes += some_bytes

853

buffer = StringIO(knit_bytes)

854

def reader_func(count):

855

if count is None:

856

return buffer.read()

857

else:

858

return buffer.read(count)

791

859

knit.insert_data_stream(

792

(format, data_list, StringIO(knit_bytes).read))

793

794

@needs_read_lock

795

def missing_revision_ids(self, other, revision_id=None):

796

"""Return the revision ids that other has that this does not.

797

798

These are returned in topological order.

799

800

revision_id: only return revision ids included by revision_id.

801

"""

802

return InterRepository.get(other, self).missing_revision_ids(revision_id)

860

(format, data_list, reader_func))

861

862

@needs_read_lock

863

def search_missing_revision_ids(self, other, revision_id=None, find_ghosts=True):

864

"""Return the revision ids that other has that this does not.

865

866

These are returned in topological order.

867

868

revision_id: only return revision ids included by revision_id.

869

"""

870

return InterRepository.get(other, self).search_missing_revision_ids(

871

revision_id, find_ghosts)

872

873

@deprecated_method(symbol_versioning.one_two)

874

@needs_read_lock

875

def missing_revision_ids(self, other, revision_id=None, find_ghosts=True):

876

"""Return the revision ids that other has that this does not.

877

878

These are returned in topological order.

879

880

revision_id: only return revision ids included by revision_id.

881

"""

882

keys = self.search_missing_revision_ids(

883

other, revision_id, find_ghosts).get_keys()

884

other.lock_read()

885

try:

886

parents = other.get_graph().get_parent_map(keys)

887

finally:

888

other.unlock()

889

return tsort.topo_sort(parents)

803

890

804

891

@staticmethod

805

892

def open(base):

965

1052

@needs_read_lock

966

1053

def has_revision(self, revision_id):

967

1054

"""True if this repository has a copy of the revision."""

968

if 'evil' in debug.debug_flags:

969

mutter_callsite(3, "has_revision is a LBYL symptom.")

1055

return revision_id in self.has_revisions((revision_id,))

1056

1057

def has_revisions(self, revision_ids):

1058

"""Probe to find out the presence of multiple revisions.

1059

1060

:param revision_ids: An iterable of revision_ids.

1061

:return: A set of the revision_ids that were present.

1062

"""

1063

raise NotImplementedError(self.has_revisions)

1064

970

1065

return self._revision_store.has_revision_id(revision_id,

971

1066

self.get_transaction())

972

1067

1051

1146

@needs_write_lock

1052

1147

def store_revision_signature(self, gpg_strategy, plaintext, revision_id):

1053

1148

signature = gpg_strategy.sign(plaintext)

1149

self.add_signature_text(revision_id, signature)

1150

1151

@needs_write_lock

1152

def add_signature_text(self, revision_id, signature):

1054

1153

self._revision_store.add_revision_signature_text(revision_id,

1055

1154

signature,

1056

1155

self.get_transaction())

1057

1156

1058

def _find_file_ids_from_xml_inventory_lines(self, line_iterator,

1059

revision_ids):

1060

"""Helper routine for fileids_altered_by_revision_ids.

1157

def find_text_key_references(self):

1158

"""Find the text key references within the repository.

1159

1160

:return: a dictionary mapping (file_id, revision_id) tuples to altered file-ids to an iterable of

1161

revision_ids. Each altered file-ids has the exact revision_ids that

1162

altered it listed explicitly.

1163

:return: A dictionary mapping text keys ((fileid, revision_id) tuples)

1164

to whether they were referred to by the inventory of the

1165

revision_id that they contain. The inventory texts from all present

1166

revision ids are assessed to generate this report.

1167

"""

1168

revision_ids = self.all_revision_ids()

1169

w = self.get_inventory_weave()

1170

pb = ui.ui_factory.nested_progress_bar()

1171

try:

1172

return self._find_text_key_references_from_xml_inventory_lines(

1173

w.iter_lines_added_or_present_in_versions(revision_ids, pb=pb))

1174

finally:

1175

pb.finished()

1176

1177

def _find_text_key_references_from_xml_inventory_lines(self,

1178

line_iterator):

1179

"""Core routine for extracting references to texts from inventories.

1061

1180

1062

1181

This performs the translation of xml lines to revision ids.

1063

1182

1064

1183

:param line_iterator: An iterator of lines, origin_version_id

1065

:param revision_ids: The revision ids to filter for. This should be a

1066

set or other type which supports efficient __contains__ lookups, as

1067

the revision id from each parsed line will be looked up in the

1068

revision_ids filter.

1069

:return: a dictionary mapping altered file-ids to an iterable of

1070

revision_ids. Each altered file-ids has the exact revision_ids that

1071

altered it listed explicitly.

1184

:return: A dictionary mapping text keys ((fileid, revision_id) tuples)

1185

to whether they were referred to by the inventory of the

1186

revision_id that they contain. Note that if that revision_id was

1187

not part of the line_iterator's output then False will be given -

1188

even though it may actually refer to that key.

1072

1189

"""

1190

if not self._serializer.support_altered_by_hack:

1191

raise AssertionError(

1192

"_find_text_key_references_from_xml_inventory_lines only "

1193

"supported for branches which store inventory as unnested xml"

1194

", not on %r" % self)

1073

1195

result = {}

1074

1196

1075

1197

# this code needs to read every new line in every inventory for the

1115

1237

unescape_revid_cache[revision_id] = unescaped

1116

1238

revision_id = unescaped

1117

1239

1240

# Note that unconditionally unescaping means that we deserialise

1241

# every fileid, which for general 'pull' is not great, but we don't

1242

# really want to have some many fulltexts that this matters anyway.

1243

# RBC 20071114.

1244

try:

1245

file_id = unescape_fileid_cache[file_id]

1246

except KeyError:

1247

unescaped = unescape(file_id)

1248

unescape_fileid_cache[file_id] = unescaped

1249

file_id = unescaped

1250

1251

key = (file_id, revision_id)

1252

setdefault(key, False)

1253

if revision_id == version_id:

1254

result[key] = True

1255

return result

1256

1257

def _find_file_ids_from_xml_inventory_lines(self, line_iterator,

1258

revision_ids):

1259

"""Helper routine for fileids_altered_by_revision_ids.

1260

1261

This performs the translation of xml lines to revision ids.

1262

1263

:param line_iterator: An iterator of lines, origin_version_id

1264

:param revision_ids: The revision ids to filter for. This should be a

1265

set or other type which supports efficient __contains__ lookups, as

1266

the revision id from each parsed line will be looked up in the

1267

revision_ids filter.

1268

:return: a dictionary mapping altered file-ids to an iterable of

1269

revision_ids. Each altered file-ids has the exact revision_ids that

1270

altered it listed explicitly.

1271

"""

1272

result = {}

1273

setdefault = result.setdefault

1274

for file_id, revision_id in \

1275

self._find_text_key_references_from_xml_inventory_lines(

1276

line_iterator).iterkeys():

1118

1277

# once data is all ensured-consistent; then this is

1119

1278

# if revision_id == version_id

1120

1279

if revision_id in revision_ids:

1121

try:

1122

file_id = unescape_fileid_cache[file_id]

1123

except KeyError:

1124

unescaped = unescape(file_id)

1125

unescape_fileid_cache[file_id] = unescaped

1126

file_id = unescaped

1127

1280

setdefault(file_id, set()).add(revision_id)

1128

1281

return result

1129

1282

1135

1288

revision_ids. Each altered file-ids has the exact revision_ids that

1136

1289

altered it listed explicitly.

1137

1290

"""

1138

assert self._serializer.support_altered_by_hack, \

1139

("fileids_altered_by_revision_ids only supported for branches "

1140

"which store inventory as unnested xml, not on %r" % self)

1141

1291

selected_revision_ids = set(revision_ids)

1142

1292

w = self.get_inventory_weave()

1143

1293

pb = ui.ui_factory.nested_progress_bar()

1176

1326

raise errors.NoSuchIdInRepository(self, file_id)

1177

1327

yield callable_data, weave.get_lines(revision_id)

1178

1328

1329

def _generate_text_key_index(self, text_key_references=None,

1330

ancestors=None):

1331

"""Generate a new text key index for the repository.

1332

1333

This is an expensive function that will take considerable time to run.

1334

1335

:return: A dict mapping text keys ((file_id, revision_id) tuples) to a

1336

list of parents, also text keys. When a given key has no parents,

1337

the parents list will be [NULL_REVISION].

1338

"""

1339

# All revisions, to find inventory parents.

1340

if ancestors is None:

1341

revision_graph = self.get_revision_graph_with_ghosts()

1342

ancestors = revision_graph.get_ancestors()

1343

if text_key_references is None:

1344

text_key_references = self.find_text_key_references()

1345

pb = ui.ui_factory.nested_progress_bar()

1346

try:

1347

return self._do_generate_text_key_index(ancestors,

1348

text_key_references, pb)

1349

finally:

1350

pb.finished()

1351

1352

def _do_generate_text_key_index(self, ancestors, text_key_references, pb):

1353

"""Helper for _generate_text_key_index to avoid deep nesting."""

1354

revision_order = tsort.topo_sort(ancestors)

1355

invalid_keys = set()

1356

revision_keys = {}

1357

for revision_id in revision_order:

1358

revision_keys[revision_id] = set()

1359

text_count = len(text_key_references)

1360

# a cache of the text keys to allow reuse; costs a dict of all the

1361

# keys, but saves a 2-tuple for every child of a given key.

1362

text_key_cache = {}

1363

for text_key, valid in text_key_references.iteritems():

1364

if not valid:

1365

invalid_keys.add(text_key)

1366

else:

1367

revision_keys[text_key[1]].add(text_key)

1368

text_key_cache[text_key] = text_key

1369

del text_key_references

1370

text_index = {}

1371

text_graph = graph.Graph(graph.DictParentsProvider(text_index))

1372

NULL_REVISION = _mod_revision.NULL_REVISION

1373

# Set a cache with a size of 10 - this suffices for bzr.dev but may be

1374

# too small for large or very branchy trees. However, for 55K path

1375

# trees, it would be easy to use too much memory trivially. Ideally we

1376

# could gauge this by looking at available real memory etc, but this is

1377

# always a tricky proposition.

1378

inventory_cache = lru_cache.LRUCache(10)

1379

batch_size = 10 # should be ~150MB on a 55K path tree

1380

batch_count = len(revision_order) / batch_size + 1

1381

processed_texts = 0

1382

pb.update("Calculating text parents.", processed_texts, text_count)

1383

for offset in xrange(batch_count):

1384

to_query = revision_order[offset * batch_size:(offset + 1) *

1385

batch_size]

1386

if not to_query:

1387

break

1388

for rev_tree in self.revision_trees(to_query):

1389

revision_id = rev_tree.get_revision_id()

1390

parent_ids = ancestors[revision_id]

1391

for text_key in revision_keys[revision_id]:

1392

pb.update("Calculating text parents.", processed_texts)

1393

processed_texts += 1

1394

candidate_parents = []

1395

for parent_id in parent_ids:

1396

parent_text_key = (text_key[0], parent_id)

1397

try:

1398

check_parent = parent_text_key not in \

1399

revision_keys[parent_id]

1400

except KeyError:

1401

# the parent parent_id is a ghost:

1402

check_parent = False

1403

# truncate the derived graph against this ghost.

1404

parent_text_key = None

1405

if check_parent:

1406

# look at the parent commit details inventories to

1407

# determine possible candidates in the per file graph.

1408

# TODO: cache here.

1409

try:

1410

inv = inventory_cache[parent_id]

1411

except KeyError:

1412

inv = self.revision_tree(parent_id).inventory

1413

inventory_cache[parent_id] = inv

1414

parent_entry = inv._byid.get(text_key[0], None)

1415

if parent_entry is not None:

1416

parent_text_key = (

1417

text_key[0], parent_entry.revision)

1418

else:

1419

parent_text_key = None

1420

if parent_text_key is not None:

1421

candidate_parents.append(

1422

text_key_cache[parent_text_key])

1423

parent_heads = text_graph.heads(candidate_parents)

1424

new_parents = list(parent_heads)

1425

new_parents.sort(key=lambda x:candidate_parents.index(x))

1426

if new_parents == []:

1427

new_parents = [NULL_REVISION]

1428

text_index[text_key] = new_parents

1429

1430

for text_key in invalid_keys:

1431

text_index[text_key] = [NULL_REVISION]

1432

return text_index

1433

1179

1434

def item_keys_introduced_by(self, revision_ids, _files_pb=None):

1180

1435

"""Get an iterable listing the keys of all the data introduced by a set

1181

1436

of revision IDs.

1236

1491

1237

1492

@needs_read_lock

1238

1493

def get_inventory(self, revision_id):

1239

"""Get Inventory object by hash."""

1240

return self.deserialise_inventory(

1241

revision_id, self.get_inventory_xml(revision_id))

1494

"""Get Inventory object by revision id."""

1495

return self.iter_inventories([revision_id]).next()

1496

1497

def iter_inventories(self, revision_ids):

1498

"""Get many inventories by revision_ids.

1499

1500

This will buffer some or all of the texts used in constructing the

1501

inventories in memory, but will only parse a single inventory at a

1502

time.

1503

1504

:return: An iterator of inventories.

1505

"""

1506

assert None not in revision_ids

1507

assert _mod_revision.NULL_REVISION not in revision_ids

1508

return self._iter_inventories(revision_ids)

1509

1510

def _iter_inventories(self, revision_ids):

1511

"""single-document based inventory iteration."""

1512

texts = self.get_inventory_weave().get_texts(revision_ids)

1513

for text, revision_id in zip(texts, revision_ids):

1514

yield self.deserialise_inventory(revision_id, text)

1242

1515

1243

1516

def deserialise_inventory(self, revision_id, xml):

1244

1517

"""Transform the xml into an inventory object.

1246

1519

:param revision_id: The expected revision id of the inventory.

1247

1520

:param xml: A serialised inventory.

1248

1521

"""

1249

return self._serializer.read_inventory_from_string(xml, revision_id)

1522

result = self._serializer.read_inventory_from_string(xml, revision_id)

1523

if result.revision_id != revision_id:

1524

raise AssertionError('revision id mismatch %s != %s' % (

1525

result.revision_id, revision_id))

1526

return result

1250

1527

1251

1528

def serialise_inventory(self, inv):

1252

1529

return self._serializer.write_inventory_to_string(inv)

1412

1689

"""Return Tree for a revision on this branch.

1413

1690

1414

1691

`revision_id` may not be None or 'null:'"""

1415

assert None not in revision_ids

1416

assert _mod_revision.NULL_REVISION not in revision_ids

1417

texts = self.get_inventory_weave().get_texts(revision_ids)

1418

for text, revision_id in zip(texts, revision_ids):

1419

inv = self.deserialise_inventory(revision_id, text)

1420

yield RevisionTree(self, inv, revision_id)

1692

inventories = self.iter_inventories(revision_ids)

1693

for inv in inventories:

1694

yield RevisionTree(self, inv, inv.revision_id)

1421

1695

1422

1696

@needs_read_lock

1423

1697

def get_ancestry(self, revision_id, topo_sorted=True):

1472

1746

def revision_parents(self, revision_id):

1473

1747

return self.get_inventory_weave().parent_names(revision_id)

1474

1748

1749

@deprecated_method(symbol_versioning.one_one)

1475

1750

def get_parents(self, revision_ids):

1476

1751

"""See StackedParentsProvider.get_parents"""

1477

parents_list = []

1478

for revision_id in revision_ids:

1752

parent_map = self.get_parent_map(revision_ids)

1753

return [parent_map.get(r, None) for r in revision_ids]

1754

1755

def get_parent_map(self, keys):

1756

"""See graph._StackedParentsProvider.get_parent_map"""

1757

parent_map = {}

1758

for revision_id in keys:

1479

1759

if revision_id == _mod_revision.NULL_REVISION:

1480

parents = []

1760

parent_map[revision_id] = ()

1481

1761

else:

1482

1762

try:

1483

parents = self.get_revision(revision_id).parent_ids

1763

parent_id_list = self.get_revision(revision_id).parent_ids

1484

1764

except errors.NoSuchRevision:

1485

parents = None

1765

pass

1486

1766

else:

1487

if len(parents) == 0:

1488

parents = [_mod_revision.NULL_REVISION]

1489

parents_list.append(parents)

1490

return parents_list

1767

if len(parent_id_list) == 0:

1768

parent_ids = (_mod_revision.NULL_REVISION,)

1769

else:

1770

parent_ids = tuple(parent_id_list)

1771

parent_map[revision_id] = parent_ids

1772

return parent_map

1491

1773

1492

1774

def _make_parents_provider(self):

1493

1775

return self

1496

1778

"""Return the graph walker for this repository format"""

1497

1779

parents_provider = self._make_parents_provider()

1498

1780

if (other_repository is not None and

1499

other_repository.bzrdir.transport.base !=

1500

self.bzrdir.transport.base):

1781

not self.has_same_location(other_repository)):

1501

1782

parents_provider = graph._StackedParentsProvider(

1502

1783

[parents_provider, other_repository._make_parents_provider()])

1503

1784

return graph.Graph(parents_provider)

1504

1785

1505

def get_versioned_file_checker(self, revisions, revision_versions_cache):

1506

return VersionedFileChecker(revisions, revision_versions_cache, self)

1786

def _get_versioned_file_checker(self):

1787

"""Return an object suitable for checking versioned files."""

1788

return _VersionedFileChecker(self)

1789

1790

def revision_ids_to_search_result(self, result_set):

1791

"""Convert a set of revision ids to a graph SearchResult."""

1792

result_parents = set()

1793

for parents in self.get_graph().get_parent_map(

1794

result_set).itervalues():

1795

result_parents.update(parents)

1796

included_keys = result_set.intersection(result_parents)

1797

start_keys = result_set.difference(included_keys)

1798

exclude_keys = result_parents.difference(result_set)

1799

result = graph.SearchResult(start_keys, exclude_keys,

1800

len(result_set), result_set)

1801

return result

1507

1802

1508

1803

@needs_write_lock

1509

1804

def set_make_working_trees(self, new_value):

1591

1886

depend on the revision index being consistent.

1592

1887

"""

1593

1888

raise NotImplementedError(self.revision_graph_can_have_wrong_parents)

1594

1889

1890

1595

1891

# remove these delegates a while after bzr 0.15

1596

1892

def __make_delegated(name, from_module):

1597

1893

def _deprecated_repository_forwarder():

1628

1924

1629

1925

def install_revision(repository, rev, revision_tree):

1630

1926

"""Install all revision data into a repository."""

1927

install_revisions(repository, [(rev, revision_tree, None)])

1928

1929

1930

def install_revisions(repository, iterable, num_revisions=None, pb=None):

1931

"""Install all revision data into a repository.

1932

1933

Accepts an iterable of revision, tree, signature tuples. The signature

1934

may be None.

1935

"""

1631

1936

repository.start_write_group()

1632

1937

try:

1633

_install_revision(repository, rev, revision_tree)

1938

for n, (revision, revision_tree, signature) in enumerate(iterable):

1939

_install_revision(repository, revision, revision_tree, signature)

1940

if pb is not None:

1941

pb.update('Transferring revisions', n + 1, num_revisions)

1634

1942

except:

1635

1943

repository.abort_write_group()

1636

1944

raise

1638

1946

repository.commit_write_group()

1639

1947

1640

1948

1641

def _install_revision(repository, rev, revision_tree):

1949

def _install_revision(repository, rev, revision_tree, signature):

1642

1950

"""Install all revision data into a repository."""

1643

1951

present_parents = []

1644

1952

parent_trees = {}

1683

1991

repository.add_inventory(rev.revision_id, inv, present_parents)

1684

1992

except errors.RevisionAlreadyPresent:

1685

1993

pass

1994

if signature is not None:

1995

repository.add_signature_text(rev.revision_id, signature)

1686

1996

repository.add_revision(rev.revision_id, rev, inv)

1687

1997

1688

1998

1774

2084

_matchingbzrdir - the bzrdir format that the repository format was

1775

2085

originally written to work with. This can be used if manually

1776

2086

constructing a bzrdir and repository, or more commonly for test suite

1777

parameterisation.

2087

parameterization.

1778

2088

"""

1779

2089

1780

2090

# Set to True or False in derived classes. True indicates that the format

1968

2278

'RepositoryFormat7'

1969

2279

)

1970

2280

1971

# KEEP in sync with bzrdir.format_registry default, which controls the overall

1972

# default control directory format

1973

2281

format_registry.register_lazy(

1974

2282

'Bazaar-NG Knit Repository Format 1',

1975

2283

'bzrlib.repofmt.knitrepo',

1976

2284

'RepositoryFormatKnit1',

1977

2285

)

1978

format_registry.default_key = 'Bazaar-NG Knit Repository Format 1'

1979

2286

1980

2287

format_registry.register_lazy(

1981

2288

'Bazaar Knit Repository Format 3 (bzr 0.15)\n',

1983

2290

'RepositoryFormatKnit3',

1984

2291

)

1985

2292

2293

format_registry.register_lazy(

2294

'Bazaar Knit Repository Format 4 (bzr 1.0)\n',

2295

'bzrlib.repofmt.knitrepo',

2296

'RepositoryFormatKnit4',

2297

)

2298

1986

2299

# Pack-based formats. There is one format for pre-subtrees, and one for

1987

2300

# post-subtrees to allow ease of testing.

1988

2301

# NOTE: These are experimental in 0.92.

1996

2309

'bzrlib.repofmt.pack_repo',

1997

2310

'RepositoryFormatKnitPack3',

1998

2311

)

2312

format_registry.register_lazy(

2313

'Bazaar pack repository format 1 with rich root (needs bzr 1.0)\n',

2314

'bzrlib.repofmt.pack_repo',

2315

'RepositoryFormatKnitPack4',

2316

)

1999

2317

2000

2318

2001

2319

class InterRepository(InterObject):

2030

2348

(copied, failures).

2031

2349

"""

2032

2350

raise NotImplementedError(self.fetch)

2351

2352

def _walk_to_common_revisions(self, revision_ids):

2353

"""Walk out from revision_ids in source to revisions target has.

2354

2355

:param revision_ids: The start point for the search.

2356

:return: A set of revision ids.

2357

"""

2358

graph = self.source.get_graph()

2359

missing_revs = set()

2360

# ensure we don't pay silly lookup costs.

2361

revision_ids = frozenset(revision_ids)

2362

searcher = graph._make_breadth_first_searcher(revision_ids)

2363

null_set = frozenset([_mod_revision.NULL_REVISION])

2364

while True:

2365

try:

2366

next_revs, ghosts = searcher.next_with_ghosts()

2367

except StopIteration:

2368

break

2369

if revision_ids.intersection(ghosts):

2370

absent_ids = set(revision_ids.intersection(ghosts))

2371

# If all absent_ids are present in target, no error is needed.

2372

absent_ids.difference_update(

2373

self.target.has_revisions(absent_ids))

2374

if absent_ids:

2375

raise errors.NoSuchRevision(self.source, absent_ids.pop())

2376

# we don't care about other ghosts as we can't fetch them and

2377

# haven't been asked to.

2378

next_revs = set(next_revs)

2379

# we always have NULL_REVISION present.

2380

have_revs = self.target.has_revisions(next_revs).union(null_set)

2381

missing_revs.update(next_revs - have_revs)

2382

searcher.stop_searching_any(have_revs)

2383

return searcher.get_result()

2033

2384

2385

@deprecated_method(symbol_versioning.one_two)

2034

2386

@needs_read_lock

2035

def missing_revision_ids(self, revision_id=None):

2387

def missing_revision_ids(self, revision_id=None, find_ghosts=True):

2036

2388

"""Return the revision ids that source has that target does not.

2037

2389

2038

2390

These are returned in topological order.

2039

2391

2040

2392

:param revision_id: only return revision ids included by this

2041

2393

revision_id.

2042

"""

2394

:param find_ghosts: If True find missing revisions in deep history

2395

rather than just finding the surface difference.

2396

"""

2397

return list(self.search_missing_revision_ids(

2398

revision_id, find_ghosts).get_keys())

2399

2400

@needs_read_lock

2401

def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):

2402

"""Return the revision ids that source has that target does not.

2403

2404

:param revision_id: only return revision ids included by this

2405

revision_id.

2406

:param find_ghosts: If True find missing revisions in deep history

2407

rather than just finding the surface difference.

2408

:return: A bzrlib.graph.SearchResult.

2409

"""

2410

# stop searching at found target revisions.

2411

if not find_ghosts and revision_id is not None:

2412

return self._walk_to_common_revisions([revision_id])

2043

2413

# generic, possibly worst case, slow code path.

2044

2414

target_ids = set(self.target.all_revision_ids())

2045

2415

if revision_id is not None:

2049

2419

else:

2050

2420

source_ids = self.source.all_revision_ids()

2051

2421

result_set = set(source_ids).difference(target_ids)

2052

# this may look like a no-op: its not. It preserves the ordering

2053

# other_ids had while only returning the members from other_ids

2054

# that we've decided we need.

2055

return [rev_id for rev_id in source_ids if rev_id in result_set]

2422

return self.source.revision_ids_to_search_result(result_set)

2056

2423

2057

2424

@staticmethod

2058

2425

def _same_model(source, target):

2117

2484

f = GenericRepoFetcher(to_repository=self.target,

2118

2485

from_repository=self.source,

2119

2486

last_revision=revision_id,

2120

pb=pb)

2487

pb=pb, find_ghosts=find_ghosts)

2121

2488

return f.count_copied, f.failed_revisions

2122

2489

2123

2490

2195

2562

f = GenericRepoFetcher(to_repository=self.target,

2196

2563

from_repository=self.source,

2197

2564

last_revision=revision_id,

2198

pb=pb)

2565

pb=pb, find_ghosts=find_ghosts)

2199

2566

return f.count_copied, f.failed_revisions

2200

2567

2201

2568

@needs_read_lock

2202

def missing_revision_ids(self, revision_id=None):

2569

def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):

2203

2570

"""See InterRepository.missing_revision_ids()."""

2204

2571

# we want all revisions to satisfy revision_id in source.

2205

2572

# but we don't want to stat every file here and there.

2225

2592

# we do not have a revision as that would be pointless.

2226

2593

target_ids = set(self.target._all_possible_ids())

2227

2594

possibly_present_revisions = target_ids.intersection(source_ids_set)

2228

actually_present_revisions = set(self.target._eliminate_revisions_not_present(possibly_present_revisions))

2595

actually_present_revisions = set(

2596

self.target._eliminate_revisions_not_present(possibly_present_revisions))

2229

2597

required_revisions = source_ids_set.difference(actually_present_revisions)

2230

required_topo_revisions = [rev_id for rev_id in source_ids if rev_id in required_revisions]

2231

2598

if revision_id is not None:

2232

2599

# we used get_ancestry to determine source_ids then we are assured all

2233

2600

# revisions referenced are present as they are installed in topological order.

2234

2601

# and the tip revision was validated by get_ancestry.

2235

return required_topo_revisions

2602

result_set = required_revisions

2236

2603

else:

2237

2604

# if we just grabbed the possibly available ids, then

2238

2605

# we only have an estimate of whats available and need to validate

2239

2606

# that against the revision records.

2240

return self.source._eliminate_revisions_not_present(required_topo_revisions)

2607

result_set = set(

2608

self.source._eliminate_revisions_not_present(required_revisions))

2609

return self.source.revision_ids_to_search_result(result_set)

2241

2610

2242

2611

2243

2612

class InterKnitRepo(InterSameDataRepository):

2273

2642

f = KnitRepoFetcher(to_repository=self.target,

2274

2643

from_repository=self.source,

2275

2644

last_revision=revision_id,

2276

pb=pb)

2645

pb=pb, find_ghosts=find_ghosts)

2277

2646

return f.count_copied, f.failed_revisions

2278

2647

2279

2648

@needs_read_lock

2280

def missing_revision_ids(self, revision_id=None):

2649

def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):

2281

2650

"""See InterRepository.missing_revision_ids()."""

2282

2651

if revision_id is not None:

2283

2652

source_ids = self.source.get_ancestry(revision_id)

2292

2661

# we do not have a revision as that would be pointless.

2293

2662

target_ids = set(self.target.all_revision_ids())

2294

2663

possibly_present_revisions = target_ids.intersection(source_ids_set)

2295

actually_present_revisions = set(self.target._eliminate_revisions_not_present(possibly_present_revisions))

2664

actually_present_revisions = set(

2665

self.target._eliminate_revisions_not_present(possibly_present_revisions))

2296

2666

required_revisions = source_ids_set.difference(actually_present_revisions)

2297

required_topo_revisions = [rev_id for rev_id in source_ids if rev_id in required_revisions]

2298

2667

if revision_id is not None:

2299

2668

# we used get_ancestry to determine source_ids then we are assured all

2300

2669

# revisions referenced are present as they are installed in topological order.

2301

2670

# and the tip revision was validated by get_ancestry.

2302

return required_topo_revisions

2671

result_set = required_revisions

2303

2672

else:

2304

2673

# if we just grabbed the possibly available ids, then

2305

2674

# we only have an estimate of whats available and need to validate

2306

2675

# that against the revision records.

2307

return self.source._eliminate_revisions_not_present(required_topo_revisions)

2676

result_set = set(

2677

self.source._eliminate_revisions_not_present(required_revisions))

2678

return self.source.revision_ids_to_search_result(result_set)

2308

2679

2309

2680

2310

2681

class InterPackRepo(InterSameDataRepository):

2354

2725

# sensibly detect 'new revisions' without doing a full index scan.

2355

2726

elif _mod_revision.is_null(revision_id):

2356

2727

# nothing to do:

2357

return

2728

return (0, [])

2358

2729

else:

2359

2730

try:

2360

revision_ids = self.missing_revision_ids(revision_id,

2361

find_ghosts=find_ghosts)

2731

revision_ids = self.search_missing_revision_ids(revision_id,

2732

find_ghosts=find_ghosts).get_keys()

2362

2733

except errors.NoSuchRevision:

2363

2734

raise errors.InstallFailed([revision_id])

2364

2735

packs = self.source._pack_collection.all_packs()

2370

2741

# a pack creation, but for now it is simpler to think about as

2371

2742

# 'upload data, then repack if needed'.

2372

2743

self.target._pack_collection.autopack()

2373

return pack.get_revision_count()

2744

return (pack.get_revision_count(), [])

2374

2745

else:

2375

return 0

2746

return (0, [])

2376

2747

2377

2748

@needs_read_lock

2378

def missing_revision_ids(self, revision_id=None, find_ghosts=True):

2749

def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):

2379

2750

"""See InterRepository.missing_revision_ids().

2380

2751

2381

:param find_ghosts: Find ghosts throughough the ancestry of

2752

:param find_ghosts: Find ghosts throughout the ancestry of

2382

2753

revision_id.

2383

2754

"""

2384

2755

if not find_ghosts and revision_id is not None:

2385

graph = self.source.get_graph()

2386

missing_revs = set()

2387

searcher = graph._make_breadth_first_searcher([revision_id])

2388

target_index = \

2389

self.target._pack_collection.revision_index.combined_index

2390

null_set = frozenset([_mod_revision.NULL_REVISION])

2391

while True:

2392

try:

2393

next_revs = set(searcher.next())

2394

except StopIteration:

2395

break

2396

next_revs.difference_update(null_set)

2397

target_keys = [(key,) for key in next_revs]

2398

have_revs = frozenset(node[1][0] for node in

2399

target_index.iter_entries(target_keys))

2400

missing_revs.update(next_revs - have_revs)

2401

searcher.stop_searching_any(have_revs)

2402

return missing_revs

2756

return self._walk_to_common_revisions([revision_id])

2403

2757

elif revision_id is not None:

2404

2758

source_ids = self.source.get_ancestry(revision_id)

2405

2759

assert source_ids[0] is None

2411

2765

# have in target, but don't try to check for existence where we know

2412

2766

# we do not have a revision as that would be pointless.

2413

2767

target_ids = set(self.target.all_revision_ids())

2414

return [r for r in source_ids if (r not in target_ids)]

2768

result_set = set(source_ids).difference(target_ids)

2769

return self.source.revision_ids_to_search_result(result_set)

2415

2770

2416

2771

2417

2772

class InterModel1and2(InterRepository):

2434

2789

f = Model1toKnit2Fetcher(to_repository=self.target,

2435

2790

from_repository=self.source,

2436

2791

last_revision=revision_id,

2437

pb=pb)

2792

pb=pb, find_ghosts=find_ghosts)

2438

2793

return f.count_copied, f.failed_revisions

2439

2794

2440

2795

@needs_write_lock

2491

2846

f = Knit1to2Fetcher(to_repository=self.target,

2492

2847

from_repository=self.source,

2493

2848

last_revision=revision_id,

2494

pb=pb)

2849

pb=pb, find_ghosts=find_ghosts)

2495

2850

return f.count_copied, f.failed_revisions

2496

2851

2497

2852

2853

class InterDifferingSerializer(InterKnitRepo):

2854

2855

@classmethod

2856

def _get_repo_format_to_test(self):

2857

return None

2858

2859

@staticmethod

2860

def is_compatible(source, target):

2861

"""Be compatible with Knit2 source and Knit3 target"""

2862

if source.supports_rich_root() != target.supports_rich_root():

2863

return False

2864

# Ideally, we'd support fetching if the source had no tree references

2865

# even if it supported them...

2866

if (getattr(source, '_format.supports_tree_reference', False) and

2867

not getattr(target, '_format.supports_tree_reference', False)):

2868

return False

2869

return True

2870

2871

@needs_write_lock

2872

def fetch(self, revision_id=None, pb=None, find_ghosts=False):

2873

"""See InterRepository.fetch()."""

2874

revision_ids = self.target.search_missing_revision_ids(self.source,

2875

revision_id, find_ghosts=find_ghosts).get_keys()

2876

revision_ids = tsort.topo_sort(

2877

self.source.get_graph().get_parent_map(revision_ids))

2878

def revisions_iterator():

2879

for current_revision_id in revision_ids:

2880

revision = self.source.get_revision(current_revision_id)

2881

tree = self.source.revision_tree(current_revision_id)

2882

try:

2883

signature = self.source.get_signature_text(

2884

current_revision_id)

2885

except errors.NoSuchRevision:

2886

signature = None

2887

yield revision, tree, signature

2888

if pb is None:

2889

my_pb = ui.ui_factory.nested_progress_bar()

2890

pb = my_pb

2891

else:

2892

my_pb = None

2893

try:

2894

install_revisions(self.target, revisions_iterator(),

2895

len(revision_ids), pb)

2896

finally:

2897

if my_pb is not None:

2898

my_pb.finished()

2899

return len(revision_ids), 0

2900

2901

2498

2902

class InterRemoteToOther(InterRepository):

2499

2903

2500

2904

def __init__(self, source, target):

2505

2909

def is_compatible(source, target):

2506

2910

if not isinstance(source, remote.RemoteRepository):

2507

2911

return False

2912

# Is source's model compatible with target's model?

2508

2913

source._ensure_real()

2509

2914

real_source = source._real_repository

2510

# Is source's model compatible with target's model, and are they the

2511

# same format? Currently we can only optimise fetching from an

2512

# identical model & format repo.

2513

2915

assert not isinstance(real_source, remote.RemoteRepository), (

2514

2916

"We don't support remote repos backed by remote repos yet.")

2515

return real_source._format == target._format

2917

return InterRepository._same_model(real_source, target)

2516

2918

2517

2919

@needs_write_lock

2518

2920

def fetch(self, revision_id=None, pb=None, find_ghosts=False):

2525

2927

f = RemoteToOtherFetcher(to_repository=self.target,

2526

2928

from_repository=self.source,

2527

2929

last_revision=revision_id,

2528

pb=pb)

2930

pb=pb, find_ghosts=find_ghosts)

2529

2931

return f.count_copied, f.failed_revisions

2530

2932

2531

2933

@classmethod

2557

2959

2558

2960

def fetch(self, revision_id=None, pb=None, find_ghosts=False):

2559

2961

self._ensure_real_inter()

2560

self._real_inter.fetch(revision_id=revision_id, pb=pb)

2962

self._real_inter.fetch(revision_id=revision_id, pb=pb,

2963

find_ghosts=find_ghosts)

2561

2964

2562

2965

@classmethod

2563

2966

def _get_repo_format_to_test(self):

2564

2967

return None

2565

2968

2566

2969

2970

InterRepository.register_optimiser(InterDifferingSerializer)

2567

2971

InterRepository.register_optimiser(InterSameDataRepository)

2568

2972

InterRepository.register_optimiser(InterWeaveRepo)

2569

2973

InterRepository.register_optimiser(InterKnitRepo)

2656

3060

return _unescape_re.sub(_unescaper, data)

2657

3061

2658

3062

2659

class _RevisionTextVersionCache(object):

2660

"""A cache of the versionedfile versions for revision and file-id."""

3063

class _VersionedFileChecker(object):

2661

3064

2662

3065

def __init__(self, repository):

2663

3066

self.repository = repository

2664

self.revision_versions = {}

2665

self.revision_parents = {}

2666

self.repo_graph = self.repository.get_graph()

2667

# XXX: RBC: I haven't tracked down what uses this, but it would be

2668

# better to use the headscache directly I think.

2669

self.heads = graph.HeadsCache(self.repo_graph).heads

2670

2671

def add_revision_text_versions(self, tree):

2672

"""Cache text version data from the supplied revision tree"""

2673

inv_revisions = {}

2674

for path, entry in tree.iter_entries_by_dir():

2675

inv_revisions[entry.file_id] = entry.revision

2676

self.revision_versions[tree.get_revision_id()] = inv_revisions

2677

return inv_revisions

2678

2679

def get_text_version(self, file_id, revision_id):

2680

"""Determine the text version for a given file-id and revision-id"""

2681

try:

2682

inv_revisions = self.revision_versions[revision_id]

2683

except KeyError:

2684

try:

2685

tree = self.repository.revision_tree(revision_id)

2686

except errors.RevisionNotPresent:

2687

self.revision_versions[revision_id] = inv_revisions = {}

2688

else:

2689

inv_revisions = self.add_revision_text_versions(tree)

2690

return inv_revisions.get(file_id)

2691

2692

def prepopulate_revs(self, revision_ids):

2693

# Filter out versions that we don't have an inventory for, so that the

2694

# revision_trees() call won't fail.

2695

inv_weave = self.repository.get_inventory_weave()

2696

revs = [r for r in revision_ids if inv_weave.has_version(r)]

2697

# XXX: this loop is very similar to

2698

# bzrlib.fetch.Inter1and2Helper.iter_rev_trees.

2699

while revs:

2700

mutter('%d revisions left to prepopulate', len(revs))

2701

for tree in self.repository.revision_trees(revs[:100]):

2702

if tree.inventory.revision_id is None:

2703

tree.inventory.revision_id = tree.get_revision_id()

2704

self.add_revision_text_versions(tree)

2705

revs = revs[100:]

2706

2707

def get_parents(self, revision_id):

2708

try:

2709

return self.revision_parents[revision_id]

2710

except KeyError:

2711

parents = self.repository.get_parents([revision_id])[0]

2712

self.revision_parents[revision_id] = parents

2713

return parents

2714

2715

def used_file_versions(self):

2716

"""Return a set of (revision_id, file_id) pairs for each file version

2717

referenced by any inventory cached by this _RevisionTextVersionCache.

2718

2719

If the entire repository has been cached, this can be used to find all

2720

file versions that are actually referenced by inventories. Thus any

2721

other file version is completely unused and can be removed safely.

2722

"""

2723

result = set()

2724

for inventory_summary in self.revision_versions.itervalues():

2725

result.update(inventory_summary.items())

2726

return result

2727

2728

2729

class VersionedFileChecker(object):

2730

2731

def __init__(self, planned_revisions, revision_versions, repository):

2732

self.planned_revisions = planned_revisions

2733

self.revision_versions = revision_versions

2734

self.repository = repository

3067

self.text_index = self.repository._generate_text_key_index()

2735

3068

2736

3069

def calculate_file_version_parents(self, revision_id, file_id):

2737

3070

"""Calculate the correct parents for a file version according to

2738

3071

the inventories.

2739

3072

"""

2740

text_revision = self.revision_versions.get_text_version(

2741

file_id, revision_id)

2742

if text_revision is None:

2743

return None

2744

parents_of_text_revision = self.revision_versions.get_parents(

2745

text_revision)

2746

parents_from_inventories = []

2747

for parent in parents_of_text_revision:

2748

if parent == _mod_revision.NULL_REVISION:

2749

continue

2750

introduced_in = self.revision_versions.get_text_version(file_id,

2751

parent)

2752

if introduced_in is not None:

2753

parents_from_inventories.append(introduced_in)

2754

heads = set(self.revision_versions.heads(parents_from_inventories))

2755

new_parents = []

2756

for parent in parents_from_inventories:

2757

if parent in heads and parent not in new_parents:

2758

new_parents.append(parent)

2759

return tuple(new_parents)

3073

parent_keys = self.text_index[(file_id, revision_id)]

3074

if parent_keys == [_mod_revision.NULL_REVISION]:

3075

return ()

3076

# strip the file_id, for the weave api

3077

return tuple([revision_id for file_id, revision_id in parent_keys])

2760

3078

2761

3079

def check_file_version_parents(self, weave, file_id):

2762

3080

"""Check the parents stored in a versioned file are correct.

2772

3090

file, but not used by the corresponding inventory.

2773

3091

"""

2774

3092

wrong_parents = {}

2775

dangling_file_versions = set()

2776

for num, revision_id in enumerate(self.planned_revisions):

2777

correct_parents = self.calculate_file_version_parents(

2778

revision_id, file_id)

2779

if correct_parents is None:

2780

continue

2781

text_revision = self.revision_versions.get_text_version(

2782

file_id, revision_id)

3093

unused_versions = set()

3094

for num, revision_id in enumerate(weave.versions()):

2783

3095

try:

2784

knit_parents = tuple(weave.get_parents(revision_id))

2785

except errors.RevisionNotPresent:

2786

knit_parents = None

2787

if text_revision != revision_id:

2788

# This file version is not referenced by its corresponding

2789

# inventory!

2790

dangling_file_versions.add((file_id, revision_id))

2791

if correct_parents != knit_parents:

2792

wrong_parents[revision_id] = (knit_parents, correct_parents)

2793

return wrong_parents, dangling_file_versions

3096

correct_parents = self.calculate_file_version_parents(

3097

revision_id, file_id)

3098

except KeyError:

3099

# The version is not part of the used keys.

3100

unused_versions.add(revision_id)

3101

else:

3102

try:

3103

knit_parents = tuple(weave.get_parents(revision_id))

3104

except errors.RevisionNotPresent:

3105

knit_parents = None

3106

if correct_parents != knit_parents:

3107

wrong_parents[revision_id] = (knit_parents, correct_parents)

3108

return wrong_parents, unused_versions

Older »