14
14
# along with this program; if not, write to the Free Software
15
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17
from bzrlib import osutils
18
from bzrlib.errors import InvalidRevisionId
19
from bzrlib.inventory import Inventory
20
from bzrlib.repository import InterRepository
21
from bzrlib.trace import info
23
from bzrlib.plugins.git import git
24
from bzrlib.plugins.git.repository import LocalGitRepository, GitRepository, GitFormat
25
from bzrlib.plugins.git.remote import RemoteGitRepository
27
from dulwich.objects import Commit
29
from cStringIO import StringIO
17
from cStringIO import (
21
from dulwich.client import (
22
SimpleFetchGraphWalker,
24
from dulwich.objects import (
34
from bzrlib.errors import (
38
from bzrlib.inventory import (
41
from bzrlib.repository import (
44
from bzrlib.tsort import (
48
from bzrlib.plugins.git.converter import (
51
from bzrlib.plugins.git.repository import (
56
from bzrlib.plugins.git.remote import (
32
61
class BzrFetchGraphWalker(object):
62
"""GraphWalker implementation that uses a Bazaar repository."""
34
64
def __init__(self, repository, mapping):
35
65
self.repository = repository
58
91
self.heads.update([p for p in ps if not p in self.done])
61
return self.mapping.revision_id_bzr_to_foreign(ret)
94
return self.mapping.revision_id_bzr_to_foreign(ret)[0]
62
95
except InvalidRevisionId:
67
def import_git_blob(repo, mapping, path, blob):
100
def import_git_blob(texts, mapping, path, blob, inv, parent_invs, shagitmap,
68
102
"""Import a git blob object into a bzr repository.
70
:param repo: bzr repository
104
:param texts: VersionedFiles to add to
71
105
:param path: Path in the tree
72
106
:param blob: A git blob
107
:return: Inventory entry
74
109
file_id = mapping.generate_file_id(path)
75
repo.texts.add_lines((file_id, blob.id),
110
# We just have to hope this is indeed utf-8:
111
ie = inv.add_path(path.decode("utf-8"), "file", file_id)
112
ie.text_size = len(blob.data)
113
ie.text_sha1 = osutils.sha_string(blob.data)
114
ie.executable = executable
115
# See if this is the same revision as one of the parents unchanged
117
for pinv in parent_invs:
118
if not file_id in pinv:
120
if pinv[file_id].text_sha1 == ie.text_sha1:
121
ie.revision = pinv[file_id].revision
123
parent_keys.append((file_id, pinv[file_id].revision))
124
ie.revision = inv.revision_id
125
assert file_id is not None
126
assert ie.revision is not None
127
texts.add_lines((file_id, ie.revision), parent_keys,
77
128
osutils.split_lines(blob.data))
78
inv.add_path(path, "file", file_id)
81
def import_git_tree(repo, mapping, path, tree, inv, lookup_object):
129
shagitmap.add_entry(blob.sha().hexdigest(), "blob",
130
(ie.file_id, ie.revision))
134
def import_git_tree(texts, mapping, path, tree, inv, parent_invs, shagitmap,
82
136
"""Import a git tree object into a bzr repository.
84
:param repo: A Bzr repository object
138
:param texts: VersionedFiles object to add to
85
139
:param path: Path in the tree
86
140
:param tree: A git tree object
87
141
:param inv: Inventory object
89
143
file_id = mapping.generate_file_id(path)
90
repo.texts.add_lines((file_id, tree.id),
93
inv.add_path(path, "directory", file_id)
144
# We just have to hope this is indeed utf-8:
145
ie = inv.add_path(path.decode("utf-8"), "directory", file_id)
148
for pinv in parent_invs:
149
if not file_id in pinv:
152
tree_sha = shagitmap.lookup_tree(path, pinv[file_id].revision)
156
if tree_sha == tree.id:
157
ie.revision = pinv[file_id].revision
159
parent_keys.append((file_id, pinv[file_id].revision))
160
if ie.revision is None:
161
ie.revision = inv.revision_id
162
texts.add_lines((file_id, ie.revision), parent_keys, [])
163
shagitmap.add_entry(tree.id, "tree", (file_id, ie.revision))
94
164
for mode, name, hexsha in tree.entries():
95
165
entry_kind = (mode & 0700000) / 0100000
96
166
basename = name.decode("utf-8")
100
170
child_path = urlutils.join(path, name)
171
obj = lookup_object(hexsha)
101
172
if entry_kind == 0:
102
import_git_tree(repo, mapping, child_path, lookup_object, inv)
173
import_git_tree(texts, mapping, child_path, obj, inv, parent_invs,
174
shagitmap, lookup_object)
103
175
elif entry_kind == 1:
104
import_git_blob(repo, mapping, child_path, lookup_object, inv)
176
fs_mode = mode & 0777
177
import_git_blob(texts, mapping, child_path, obj, inv, parent_invs,
178
shagitmap, bool(fs_mode & 0111))
106
180
raise AssertionError("Unknown blob kind, perms=%r." % (mode,))
109
def import_git_objects(repo, mapping, object_iter):
184
def import_git_objects(repo, mapping, object_iter, target_git_object_retriever,
110
186
"""Import a set of git objects into a bzr repository.
112
188
:param repo: Bazaar repository
114
190
:param object_iter: Iterator over Git objects.
116
192
# TODO: a more (memory-)efficient implementation of this
118
for o in object_iter:
121
198
# Find and convert commit objects
122
for o in objects.iterkeys():
201
pb.update("finding revisions to fetch", len(graph), None)
203
assert isinstance(head, str)
204
o = object_iter[head]
123
205
if isinstance(o, Commit):
124
206
rev = mapping.import_commit(o)
125
root_trees[rev] = objects[o.tree_sha]
207
if repo.has_revision(rev.revision_id):
209
root_trees[rev.revision_id] = o.tree
210
revisions[rev.revision_id] = rev
211
graph.append((rev.revision_id, rev.parent_ids))
212
target_git_object_retriever._idmap.add_entry(o.sha().hexdigest(),
213
"commit", (rev.revision_id, o._tree))
214
heads.extend([p for p in o.parents if p not in checked])
216
trace.warning("Unable to import head object %r" % o)
218
# Order the revisions
126
219
# Create the inventory objects
127
for rev, root_tree in root_trees.iteritems():
220
for i, revid in enumerate(topo_sort(graph)):
222
pb.update("fetching revisions", i, len(graph))
223
root_tree = object_iter[root_trees[revid]]
224
rev = revisions[revid]
128
225
# We have to do this here, since we have to walk the tree and
129
# we need to make sure to import the blobs / trees with the riht
226
# we need to make sure to import the blobs / trees with the right
130
227
# path; this may involve adding them more than once.
131
228
inv = Inventory()
229
inv.revision_id = rev.revision_id
132
230
def lookup_object(sha):
135
return reconstruct_git_object(repo, mapping, sha)
136
import_git_tree(repo, mapping, "", tree, inv, lookup_object)
231
if sha in object_iter:
232
return object_iter[sha]
233
return target_git_object_retriever[sha]
234
parent_invs = [repo.get_inventory(r) for r in rev.parent_ids]
235
import_git_tree(repo.texts, mapping, "", root_tree, inv, parent_invs,
236
target_git_object_retriever._idmap, lookup_object)
137
237
repo.add_revision(rev.revision_id, rev, inv)
140
def reconstruct_git_commit(repo, rev):
141
raise NotImplementedError(self.reconstruct_git_commit)
144
def reconstruct_git_object(repo, mapping, sha):
146
revid = mapping.revision_id_foreign_to_bzr(sha)
148
rev = repo.get_revision(revid)
149
except NoSuchRevision:
152
return reconstruct_git_commit(rev)
156
raise KeyError("No such object %s" % sha)
159
class InterGitRepository(InterRepository):
161
_matching_repo_format = GitFormat()
238
target_git_object_retriever._idmap.commit()
241
class InterGitNonGitRepository(InterRepository):
242
"""InterRepository that copies revisions from a Git into a non-Git
245
_matching_repo_format = GitRepositoryFormat()
164
248
def _get_repo_format_to_test():
168
252
"""See InterRepository.copy_content."""
169
253
self.fetch(revision_id, pb, find_ghosts=False)
171
def fetch(self, revision_id=None, pb=None, find_ghosts=False,
174
mapping = self.source.get_mapping()
255
def fetch_objects(self, determine_wants, mapping, pb=None):
175
256
def progress(text):
177
pb.note("git: %s" % text)
179
info("git: %s" % text)
180
def determine_wants(heads):
181
if revision_id is None:
184
ret = [mapping.revision_id_bzr_to_foreign(revision_id)]
185
return [rev for rev in ret if not self.target.has_revision(mapping.revision_id_foreign_to_bzr(rev))]
257
pb.update("git: %s" % text.rstrip("\r\n"), 0, 0)
186
258
graph_walker = BzrFetchGraphWalker(self.target, mapping)
187
self.target.lock_write()
261
create_pb = pb = ui.ui_factory.nested_progress_bar()
262
target_git_object_retriever = GitObjectConverter(self.target, mapping)
265
def record_determine_wants(heads):
266
wants = determine_wants(heads)
267
recorded_wants.extend(wants)
189
import_git_objects(self.target, mapping,
190
self.source.fetch_objects(determine_wants, graph_walker,
271
self.target.lock_write()
273
self.target.start_write_group()
275
objects_iter = self.source.fetch_objects(
276
record_determine_wants,
278
target_git_object_retriever.__getitem__,
280
import_git_objects(self.target, mapping, objects_iter,
281
target_git_object_retriever, recorded_wants, pb)
283
self.target.commit_write_group()
290
def fetch(self, revision_id=None, pb=None, find_ghosts=False, mapping=None,
292
self.fetch_refs(revision_id=revision_id, pb=pb, find_ghosts=find_ghosts,
293
mapping=mapping, fetch_spec=fetch_spec)
295
def fetch_refs(self, revision_id=None, pb=None, find_ghosts=False,
296
mapping=None, fetch_spec=None):
298
mapping = self.source.get_mapping()
299
if revision_id is not None:
300
interesting_heads = [revision_id]
301
elif fetch_spec is not None:
302
interesting_heads = fetch_spec.heads
304
interesting_heads = None
306
def determine_wants(refs):
308
if interesting_heads is None:
309
ret = [sha for (ref, sha) in refs.iteritems() if not ref.endswith("^{}")]
311
ret = [mapping.revision_id_bzr_to_foreign(revid)[0] for revid in interesting_heads]
312
return [rev for rev in ret if not self.target.has_revision(mapping.revision_id_foreign_to_bzr(rev))]
313
self.fetch_objects(determine_wants, mapping, pb)
196
317
def is_compatible(source, target):
197
318
"""Be compatible with GitRepository."""
198
319
# FIXME: Also check target uses VersionedFile
199
return (isinstance(source, LocalGitRepository) and
200
target.supports_rich_root())
320
return (isinstance(source, GitRepository) and
321
target.supports_rich_root() and
322
not isinstance(target, GitRepository))
325
class InterGitRepository(InterRepository):
326
"""InterRepository that copies between Git repositories."""
328
_matching_repo_format = GitRepositoryFormat()
331
def _get_repo_format_to_test():
334
def copy_content(self, revision_id=None, pb=None):
335
"""See InterRepository.copy_content."""
336
self.fetch(revision_id, pb, find_ghosts=False)
338
def fetch(self, revision_id=None, pb=None, find_ghosts=False,
339
mapping=None, fetch_spec=None):
341
mapping = self.source.get_mapping()
343
trace.info("git: %s", text)
345
if revision_id is not None:
346
args = [mapping.revision_id_bzr_to_foreign(revision_id)[0]]
347
elif fetch_spec is not None:
348
args = [mapping.revision_id_bzr_to_foreign(revid)[0] for revid in fetch_spec.heads]
349
if fetch_spec is None and revision_id is None:
350
determine_wants = r.object_store.determine_wants_all
352
determine_wants = lambda x: [y for y in args if not y in r.object_store]
354
graphwalker = SimpleFetchGraphWalker(r.heads().values(), r.get_parents)
355
f, commit = r.object_store.add_pack()
357
self.source._git.fetch_pack(path, determine_wants, graphwalker, f.write, progress)
365
def is_compatible(source, target):
366
"""Be compatible with GitRepository."""
367
return (isinstance(source, GitRepository) and
368
isinstance(target, GitRepository))