1
# Copyright (C) 2009-2018 Jelmer Vernooij <jelmer@jelmer.uk>
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11
# GNU General Public License for more details.
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17
"""InterRepository operations."""
19
from __future__ import absolute_import
21
from io import BytesIO
24
from dulwich.errors import (
27
from dulwich.object_store import (
28
ObjectStoreGraphWalker,
30
from dulwich.protocol import (
34
from dulwich.refs import (
38
from dulwich.walk import Walker
40
from ..errors import (
42
FetchLimitUnsupported,
45
NoRoundtrippingSupport,
48
from ..repository import (
52
from ..revision import (
55
from ..sixish import (
70
DetermineWantsRecorder,
72
from .mapping import (
75
from .object_store import (
79
MissingObjectsIterator,
86
from .repository import (
95
from .unpeel_map import (
100
class InterToGitRepository(InterRepository):
101
"""InterRepository that copies into a Git repository."""
103
_matching_repo_format = GitRepositoryFormat()
105
def __init__(self, source, target):
    """Prepare an inter-repository object that copies into Git.

    :param source: Repository that revisions are read from
    :param target: Repository that revisions are written to; it supplies
        the mapping via ``get_mapping()``
    """
    super(InterToGitRepository, self).__init__(source, target)
    # The mapping comes from the target side and is then used to build
    # the object store view over the source repository.
    self.mapping = self.target.get_mapping()
    self.source_store = get_object_store(self.source, self.mapping)
111
def _get_repo_format_to_test():
114
def copy_content(self, revision_id=None, pb=None):
    """See InterRepository.copy_content.

    Delegates to ``self.fetch`` with ghost searching disabled.

    :param revision_id: Passed to ``fetch`` as its first positional
        argument (``None`` by default)
    :param pb: Passed to ``fetch`` as its second positional argument
    """
    self.fetch(revision_id, pb, find_ghosts=False)
118
def fetch_refs(self, update_refs, lossy, overwrite=False):
    """Fetch possibly roundtripped revisions into the target repository.

    Not implemented at this level; this version always raises.

    :param update_refs: Generate refs to fetch. Receives dictionary
        with old refs (git shas), returns dictionary keyed by new names
    :param lossy: Whether to roundtrip
    :param overwrite: Accepted for interface compatibility; unused here
    :return: old refs, new refs
    :raise NotImplementedError: always
    """
    raise NotImplementedError(self.fetch_refs)
130
def search_missing_revision_ids(self,
131
find_ghosts=True, revision_ids=None,
132
if_present_ids=None, limit=None):
133
if limit is not None:
134
raise FetchLimitUnsupported(self)
138
todo.extend(revision_ids)
140
todo.extend(revision_ids)
141
with self.source_store.lock_read():
142
for revid in revision_ids:
143
if revid == NULL_REVISION:
146
git_sha = self.source_store._lookup_revision_sha1(revid)
148
raise NoSuchRevision(revid, self.source)
149
git_shas.append(git_sha)
154
sha for sha in self.target.controldir.get_refs_container().as_dict().values()
156
missing_revids = set()
158
for (kind, type_data) in self.source_store.lookup_git_sha(
161
missing_revids.add(type_data[0])
162
return self.source.revision_ids_to_search_result(missing_revids)
164
def _warn_slow(self):
165
if not config.GlobalConfig().suppress_warning('slow_intervcs_push'):
167
'Pushing from a Bazaar to a Git repository. '
168
'For better performance, push into a Bazaar repository.')
171
class InterToLocalGitRepository(InterToGitRepository):
172
"""InterBranch implementation between a Bazaar and a Git repository."""
174
def __init__(self, source, target):
    """Prepare an inter-repository object targeting a local Git repository.

    In addition to the base-class setup, keeps direct references to the
    target's Git object store and refs container.

    :param source: Repository that revisions are read from
    :param target: Repository whose ``controldir._git`` exposes
        ``object_store`` and ``refs``
    """
    super(InterToLocalGitRepository, self).__init__(source, target)
    self.target_store = self.target.controldir._git.object_store
    self.target_refs = self.target.controldir._git.refs
179
def _commit_needs_fetching(self, sha_id):
181
return (sha_id not in self.target_store)
182
except NoSuchRevision:
186
def _revision_needs_fetching(self, sha_id, revid):
187
if revid == NULL_REVISION:
191
sha_id = self.source_store._lookup_revision_sha1(revid)
194
return self._commit_needs_fetching(sha_id)
196
def missing_revisions(self, stop_revisions):
197
"""Find the revisions that are missing from the target repository.
199
:param stop_revisions: Revisions to check for (tuples with
201
:return: sequence of missing revisions, in topological order
202
:raise: NoSuchRevision if the stop_revisions are not present in
207
for (sha1, revid) in stop_revisions:
208
if sha1 is not None and revid is not None:
209
revid_sha_map[revid] = sha1
210
stop_revids.append(revid)
211
elif sha1 is not None:
212
if self._commit_needs_fetching(sha1):
213
for (kind, (revid, tree_sha, verifiers)) in self.source_store.lookup_git_sha(sha1):
214
revid_sha_map[revid] = sha1
215
stop_revids.append(revid)
219
stop_revids.append(revid)
221
graph = self.source.get_graph()
222
with ui.ui_factory.nested_progress_bar() as pb:
225
for revid in stop_revids:
226
sha1 = revid_sha_map.get(revid)
227
if (revid not in missing and
228
self._revision_needs_fetching(sha1, revid)):
230
new_stop_revids.append(revid)
232
parent_map = graph.get_parent_map(new_stop_revids)
233
for parent_revids in viewvalues(parent_map):
234
stop_revids.update(parent_revids)
235
pb.update("determining revisions to fetch", len(missing))
236
return graph.iter_topo_order(missing)
238
def _get_target_bzr_refs(self):
239
"""Return a dictionary with references.
241
:return: Dictionary with reference names as keys and tuples
242
with Git SHA, Bazaar revid as values.
245
for k in self.target._git.refs.allkeys():
247
v = self.target._git.refs.read_ref(k)
252
if v and not v.startswith(SYMREF):
254
for (kind, type_data) in self.source_store.lookup_git_sha(
256
if kind == "commit" and self.source.has_revision(
262
bzr_refs[k] = (v, revid)
265
def fetch_refs(self, update_refs, lossy, overwrite=False):
268
with self.source_store.lock_read():
269
old_refs = self._get_target_bzr_refs()
270
new_refs = update_refs(old_refs)
271
revidmap = self.fetch_objects(
272
[(git_sha, bzr_revid)
273
for (git_sha, bzr_revid) in new_refs.values()
274
if git_sha is None or not git_sha.startswith(SYMREF)],
276
for name, (gitid, revid) in viewitems(new_refs):
279
gitid = revidmap[revid][0]
281
gitid = self.source_store._lookup_revision_sha1(revid)
282
if gitid.startswith(SYMREF):
283
self.target_refs.set_symbolic_ref(
284
name, gitid[len(SYMREF):])
287
old_git_id = old_refs[name][0]
289
self.target_refs.add_if_new(name, gitid)
291
self.target_refs.set_if_equals(name, old_git_id, gitid)
292
result_refs[name] = (gitid, revid if not lossy else self.mapping.revision_id_foreign_to_bzr(gitid))
293
return revidmap, old_refs, result_refs
295
def fetch_objects(self, revs, lossy, limit=None):
296
if not lossy and not self.mapping.roundtripping:
297
for git_sha, bzr_revid in revs:
298
if (bzr_revid is not None and
299
needs_roundtripping(self.source, bzr_revid)):
300
raise NoPushSupport(self.source, self.target, self.mapping,
302
with self.source_store.lock_read():
303
todo = list(self.missing_revisions(revs))[:limit]
305
with ui.ui_factory.nested_progress_bar() as pb:
306
object_generator = MissingObjectsIterator(
307
self.source_store, self.source, pb)
308
for (old_revid, git_sha) in object_generator.import_revisions(
311
new_revid = self.mapping.revision_id_foreign_to_bzr(
314
new_revid = old_revid
316
self.mapping.revision_id_bzr_to_foreign(old_revid)
317
except InvalidRevisionId:
319
revidmap[old_revid] = (git_sha, new_revid)
320
self.target_store.add_objects(object_generator)
323
def fetch(self, revision_id=None, pb=None, find_ghosts=False,
324
fetch_spec=None, mapped_refs=None, lossy=False):
325
if mapped_refs is not None:
326
stop_revisions = mapped_refs
327
elif revision_id is not None:
328
stop_revisions = [(None, revision_id)]
329
elif fetch_spec is not None:
330
recipe = fetch_spec.get_recipe()
331
if recipe[0] in ("search", "proxy-search"):
332
stop_revisions = [(None, revid) for revid in recipe[1]]
334
raise AssertionError(
335
"Unsupported search result type %s" % recipe[0])
337
stop_revisions = [(None, revid)
338
for revid in self.source.all_revision_ids()]
341
revidmap = self.fetch_objects(stop_revisions, lossy=lossy)
342
except NoPushSupport:
343
raise NoRoundtrippingSupport(self.source, self.target)
344
return FetchResult(revidmap)
347
def is_compatible(source, target):
    """Be compatible with GitRepository.

    :param source: Candidate source repository
    :param target: Candidate target repository
    :return: True when ``source`` is not a ``GitRepository`` and
        ``target`` is a ``LocalGitRepository``
    """
    # NOTE(review): takes no ``self`` -- presumably declared as a
    # staticmethod on a line outside this view; confirm.
    return (not isinstance(source, GitRepository) and
            isinstance(target, LocalGitRepository))
353
class InterToRemoteGitRepository(InterToGitRepository):
355
def fetch_refs(self, update_refs, lossy, overwrite=False):
356
"""Import the gist of the ancestry of a particular revision."""
357
if not lossy and not self.mapping.roundtripping:
358
raise NoPushSupport(self.source, self.target, self.mapping)
359
unpeel_map = UnpeelMap.from_repository(self.source)
362
def git_update_refs(old_refs):
365
k: (v, None) for (k, v) in viewitems(old_refs)}
366
new_refs = update_refs(self.old_refs)
367
for name, (gitid, revid) in viewitems(new_refs):
369
git_sha = self.source_store._lookup_revision_sha1(revid)
370
gitid = unpeel_map.re_unpeel_tag(
371
git_sha, old_refs.get(name))
373
if remote_divergence(
374
old_refs.get(name), gitid, self.source_store):
375
raise DivergedBranches(self.source, self.target)
379
with self.source_store.lock_read():
380
result = self.target.send_pack(
381
git_update_refs, self.source_store.generate_lossy_pack_data)
382
if result is not None and not isinstance(result, dict):
383
for ref, error in result.ref_status.items():
385
raise RemoteGitError(
386
'unable to update ref %r: %s' % (ref, error))
387
new_refs = result.refs
388
else: # dulwich < 0.20.3
391
return revidmap, self.old_refs, new_refs
394
def is_compatible(source, target):
    """Be compatible with GitRepository.

    :param source: Candidate source repository
    :param target: Candidate target repository
    :return: True when ``source`` is not a ``GitRepository`` and
        ``target`` is a ``RemoteGitRepository``
    """
    # NOTE(review): takes no ``self`` -- presumably declared as a
    # staticmethod on a line outside this view; confirm.
    return (not isinstance(source, GitRepository) and
            isinstance(target, RemoteGitRepository))
400
class GitSearchResult(object):
402
def __init__(self, start, exclude, keys):
404
self._exclude = exclude
410
def get_recipe(self):
    """Return the recipe tuple describing this search result.

    :return: ``('search', start, exclude, key_count)`` where the middle
        two items are ``self._start`` and ``self._exclude`` and
        ``key_count`` is ``len(self._keys)``
    """
    return ('search', self._start, self._exclude, len(self._keys))
414
class InterFromGitRepository(InterRepository):
416
_matching_repo_format = GitRepositoryFormat()
418
def _target_has_shas(self, shas):
419
raise NotImplementedError(self._target_has_shas)
421
def get_determine_wants_heads(self, wants, include_tags=False, tag_selector=None):
424
def determine_wants(refs):
426
for k, v in viewitems(refs):
427
if k.endswith(ANNOTATED_TAG_SUFFIX):
428
unpeel_lookup[v] = refs[k[:-len(ANNOTATED_TAG_SUFFIX)]]
429
potential = set([unpeel_lookup.get(w, w) for w in wants])
431
for k, sha in viewitems(refs):
432
if k.endswith(ANNOTATED_TAG_SUFFIX):
435
tag_name = ref_to_tag_name(k)
438
if tag_selector and not tag_selector(tag_name):
443
return list(potential - self._target_has_shas(potential))
444
return determine_wants
446
def determine_wants_all(self, refs):
    """Determine the wanted SHAs when everything should be fetched.

    Not implemented at this level; this version always raises.

    :param refs: Refs offered by the source
    :raise NotImplementedError: always
    """
    raise NotImplementedError(self.determine_wants_all)
450
def _get_repo_format_to_test():
453
def copy_content(self, revision_id=None):
    """See InterRepository.copy_content.

    Delegates to ``self.fetch`` with ghost searching disabled.

    :param revision_id: Passed to ``fetch`` as its first positional
        argument (``None`` by default)
    """
    self.fetch(revision_id, find_ghosts=False)
457
def search_missing_revision_ids(self,
458
find_ghosts=True, revision_ids=None,
459
if_present_ids=None, limit=None):
460
if limit is not None:
461
raise FetchLimitUnsupported(self)
462
if revision_ids is None and if_present_ids is None:
463
todo = set(self.source.all_revision_ids())
466
if revision_ids is not None:
467
for revid in revision_ids:
468
if not self.source.has_revision(revid):
469
raise NoSuchRevision(revid, self.source)
470
todo.update(revision_ids)
471
if if_present_ids is not None:
472
todo.update(if_present_ids)
473
result_set = todo.difference(self.target.all_revision_ids())
474
result_parents = set(itertools.chain.from_iterable(viewvalues(
475
self.source.get_graph().get_parent_map(result_set))))
476
included_keys = result_set.intersection(result_parents)
477
start_keys = result_set.difference(included_keys)
478
exclude_keys = result_parents.difference(result_set)
479
return GitSearchResult(start_keys, exclude_keys, result_set)
482
class InterGitNonGitRepository(InterFromGitRepository):
483
"""Base InterRepository that copies revisions from a Git into a non-Git
486
def _target_has_shas(self, shas):
490
revid = self.source.lookup_foreign_revision_id(sha)
491
except NotCommitError:
492
# Commit is definitely not present
496
return set([revids[r] for r in self.target.has_revisions(revids)])
498
def determine_wants_all(self, refs):
500
for k, v in viewitems(refs):
501
# For non-git target repositories, only worry about peeled
504
potential.add(self.source.controldir.get_peeled(k) or v)
505
return list(potential - self._target_has_shas(potential))
507
def _warn_slow(self):
508
if not config.GlobalConfig().suppress_warning('slow_intervcs_push'):
510
'Fetching from Git to Bazaar repository. '
511
'For better performance, fetch into a Git repository.')
513
def fetch_objects(self, determine_wants, mapping, limit=None, lossy=False):
    """Fetch objects from a remote server.

    Not implemented at this level; this version always raises.

    :param determine_wants: determine_wants callback
    :param mapping: BzrGitMapping to use
    :param limit: Maximum number of commits to import.
    :param lossy: Accepted for interface compatibility; unused here
    :return: Tuple with pack hint, last imported revision id and remote
        refs
    :raise NotImplementedError: always
    """
    raise NotImplementedError(self.fetch_objects)
524
def get_determine_wants_revids(self, revids, include_tags=False, tag_selector=None):
526
for revid in set(revids):
527
if self.target.has_revision(revid):
529
git_sha, mapping = self.source.lookup_bzr_revision_id(revid)
531
return self.get_determine_wants_heads(
532
wants, include_tags=include_tags, tag_selector=tag_selector)
534
def fetch(self, revision_id=None, find_ghosts=False,
535
mapping=None, fetch_spec=None, include_tags=False, lossy=False):
537
mapping = self.source.get_mapping()
538
if revision_id is not None:
539
interesting_heads = [revision_id]
540
elif fetch_spec is not None:
541
recipe = fetch_spec.get_recipe()
542
if recipe[0] in ("search", "proxy-search"):
543
interesting_heads = recipe[1]
545
raise AssertionError("Unsupported search result type %s" %
548
interesting_heads = None
550
if interesting_heads is not None:
551
determine_wants = self.get_determine_wants_revids(
552
interesting_heads, include_tags=include_tags)
554
determine_wants = self.determine_wants_all
556
(pack_hint, _, remote_refs) = self.fetch_objects(
557
determine_wants, mapping, lossy=lossy)
558
if pack_hint is not None and self.target._format.pack_compresses:
559
self.target.pack(hint=pack_hint)
560
result = FetchResult()
561
result.refs = remote_refs
565
class InterRemoteGitNonGitRepository(InterGitNonGitRepository):
566
"""InterRepository that copies revisions from a remote Git into a non-Git
569
def get_target_heads(self):
570
# FIXME: This should be more efficient
571
all_revs = self.target.all_revision_ids()
572
parent_map = self.target.get_parent_map(all_revs)
574
for values in viewvalues(parent_map):
575
all_parents.update(values)
576
return set(all_revs) - all_parents
578
def fetch_objects(self, determine_wants, mapping, limit=None, lossy=False):
579
"""See `InterGitNonGitRepository`."""
581
store = get_object_store(self.target, mapping)
582
with store.lock_write():
583
heads = self.get_target_heads()
584
graph_walker = ObjectStoreGraphWalker(
585
[store._lookup_revision_sha1(head) for head in heads],
586
lambda sha: store[sha].parents)
587
wants_recorder = DetermineWantsRecorder(determine_wants)
589
with ui.ui_factory.nested_progress_bar() as pb:
590
objects_iter = self.source.fetch_objects(
591
wants_recorder, graph_walker, store.get_raw)
592
trace.mutter("Importing %d new revisions",
593
len(wants_recorder.wants))
594
(pack_hint, last_rev) = import_git_objects(
595
self.target, mapping, objects_iter, store,
596
wants_recorder.wants, pb, limit)
597
return (pack_hint, last_rev, wants_recorder.remote_refs)
600
def is_compatible(source, target):
601
"""Be compatible with GitRepository."""
602
if not isinstance(source, RemoteGitRepository):
604
if not target.supports_rich_root():
606
if isinstance(target, GitRepository):
608
if not getattr(target._format, "supports_full_versioned_files", True):
613
class InterLocalGitNonGitRepository(InterGitNonGitRepository):
614
"""InterRepository that copies revisions from a local Git into a non-Git
617
def fetch_objects(self, determine_wants, mapping, limit=None, lossy=False):
618
"""See `InterGitNonGitRepository`."""
620
remote_refs = self.source.controldir.get_refs_container().as_dict()
621
wants = determine_wants(remote_refs)
622
target_git_object_retriever = get_object_store(self.target, mapping)
623
with ui.ui_factory.nested_progress_bar() as pb:
624
target_git_object_retriever.lock_write()
626
(pack_hint, last_rev) = import_git_objects(
627
self.target, mapping, self.source._git.object_store,
628
target_git_object_retriever, wants, pb, limit)
629
return (pack_hint, last_rev, remote_refs)
631
target_git_object_retriever.unlock()
634
def is_compatible(source, target):
635
"""Be compatible with GitRepository."""
636
if not isinstance(source, LocalGitRepository):
638
if not target.supports_rich_root():
640
if isinstance(target, GitRepository):
642
if not getattr(target._format, "supports_full_versioned_files", True):
647
class InterGitGitRepository(InterFromGitRepository):
648
"""InterRepository that copies between Git repositories."""
650
def fetch_refs(self, update_refs, lossy, overwrite=False):
652
raise LossyPushToSameVCS(self.source, self.target)
653
old_refs = self.target.controldir.get_refs_container()
656
def determine_wants(heads):
657
old_refs = dict([(k, (v, None))
658
for (k, v) in viewitems(heads.as_dict())])
659
new_refs = update_refs(old_refs)
660
ref_changes.update(new_refs)
661
return [sha1 for (sha1, bzr_revid) in viewvalues(new_refs)]
662
self.fetch_objects(determine_wants, lossy=lossy)
663
for k, (git_sha, bzr_revid) in viewitems(ref_changes):
664
self.target._git.refs[k] = git_sha
665
new_refs = self.target.controldir.get_refs_container()
666
return None, old_refs, new_refs
668
def fetch_objects(self, determine_wants, mapping=None, limit=None,
670
raise NotImplementedError(self.fetch_objects)
672
def _target_has_shas(self, shas):
674
[sha for sha in shas if sha in self.target._git.object_store])
676
def fetch(self, revision_id=None, find_ghosts=False,
677
mapping=None, fetch_spec=None, branches=None, limit=None,
678
include_tags=False, lossy=False):
680
mapping = self.source.get_mapping()
681
if revision_id is not None:
683
elif fetch_spec is not None:
684
recipe = fetch_spec.get_recipe()
685
if recipe[0] in ("search", "proxy-search"):
688
raise AssertionError(
689
"Unsupported search result type %s" % recipe[0])
691
if branches is not None:
692
determine_wants = self.get_determine_wants_branches(
693
branches, include_tags=include_tags)
694
elif fetch_spec is None and revision_id is None:
695
determine_wants = self.determine_wants_all
697
determine_wants = self.get_determine_wants_revids(
698
args, include_tags=include_tags)
699
wants_recorder = DetermineWantsRecorder(determine_wants)
700
self.fetch_objects(wants_recorder, mapping, limit=limit, lossy=lossy)
701
result = FetchResult()
702
result.refs = wants_recorder.remote_refs
705
def get_determine_wants_revids(self, revids, include_tags=False, tag_selector=None):
707
for revid in set(revids):
708
if revid == NULL_REVISION:
710
git_sha, mapping = self.source.lookup_bzr_revision_id(revid)
712
return self.get_determine_wants_heads(wants, include_tags=include_tags, tag_selector=tag_selector)
714
def get_determine_wants_branches(self, branches, include_tags=False):
715
def determine_wants(refs):
717
for name, value in viewitems(refs):
718
if value == ZERO_SHA:
721
if name.endswith(ANNOTATED_TAG_SUFFIX):
724
if name in branches or (include_tags and is_tag(name)):
727
return determine_wants
729
def determine_wants_all(self, refs):
731
v for k, v in refs.items()
732
if not v == ZERO_SHA and not k.endswith(ANNOTATED_TAG_SUFFIX)])
733
return list(potential - self._target_has_shas(potential))
736
class InterLocalGitLocalGitRepository(InterGitGitRepository):
738
def fetch_objects(self, determine_wants, mapping=None, limit=None,
741
raise LossyPushToSameVCS(self.source, self.target)
742
if limit is not None:
743
raise FetchLimitUnsupported(self)
744
from .remote import DefaultProgressReporter
745
with ui.ui_factory.nested_progress_bar() as pb:
746
progress = DefaultProgressReporter(pb).progress
747
refs = self.source._git.fetch(
748
self.target._git, determine_wants,
750
return (None, None, refs)
753
def is_compatible(source, target):
    """Be compatible with GitRepository.

    :param source: Candidate source repository
    :param target: Candidate target repository
    :return: True when both ``source`` and ``target`` are
        ``LocalGitRepository`` instances
    """
    # NOTE(review): takes no ``self`` -- presumably declared as a
    # staticmethod on a line outside this view; confirm.
    return (isinstance(source, LocalGitRepository) and
            isinstance(target, LocalGitRepository))
759
class InterRemoteGitLocalGitRepository(InterGitGitRepository):
761
def fetch_objects(self, determine_wants, mapping=None, limit=None,
764
raise LossyPushToSameVCS(self.source, self.target)
765
if limit is not None:
766
raise FetchLimitUnsupported(self)
767
graphwalker = self.target._git.get_graph_walker()
768
if (CAPABILITY_THIN_PACK in
769
self.source.controldir._client._fetch_capabilities):
770
# TODO(jelmer): Avoid reading entire file into memory and
771
# only processing it after the whole file has been fetched.
777
self.target._git.object_store.move_in_thin_pack(f)
782
f, commit, abort = self.target._git.object_store.add_pack()
784
refs = self.source.controldir.fetch_pack(
785
determine_wants, graphwalker, f.write)
787
return (None, None, refs)
788
except BaseException:
793
def is_compatible(source, target):
    """Be compatible with GitRepository.

    :param source: Candidate source repository
    :param target: Candidate target repository
    :return: True when ``source`` is a ``RemoteGitRepository`` and
        ``target`` is a ``LocalGitRepository``
    """
    # NOTE(review): takes no ``self`` -- presumably declared as a
    # staticmethod on a line outside this view; confirm.
    return (isinstance(source, RemoteGitRepository) and
            isinstance(target, LocalGitRepository))