14
14
# along with this program; if not, write to the Free Software
15
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17
from bzrlib import osutils, ui, urlutils
18
from bzrlib.errors import InvalidRevisionId
19
from bzrlib.inventory import Inventory
20
from bzrlib.repository import InterRepository
21
from bzrlib.trace import info
22
from bzrlib.tsort import topo_sort
24
from bzrlib.plugins.git import git
17
from cStringIO import (
21
from dulwich.client import (
22
SimpleFetchGraphWalker,
24
from dulwich.objects import (
34
from bzrlib.errors import (
38
from bzrlib.inventory import (
41
from bzrlib.repository import (
44
from bzrlib.tsort import (
48
from bzrlib.plugins.git.converter import (
25
51
from bzrlib.plugins.git.repository import (
30
from bzrlib.plugins.git.remote import RemoteGitRepository
32
from dulwich.objects import Commit
34
from cStringIO import StringIO
56
from bzrlib.plugins.git.remote import (
37
61
class BzrFetchGraphWalker(object):
62
"""GraphWalker implementation that uses a Bazaar repository."""
39
64
def __init__(self, repository, mapping):
40
65
self.repository = repository
63
91
self.heads.update([p for p in ps if not p in self.done])
66
return self.mapping.revision_id_bzr_to_foreign(ret)
94
return self.mapping.revision_id_bzr_to_foreign(ret)[0]
67
95
except InvalidRevisionId:
72
def import_git_blob(repo, mapping, path, blob, inv, parent_invs, executable):
100
def import_git_blob(texts, mapping, path, blob, inv, parent_invs, shagitmap,
73
102
"""Import a git blob object into a bzr repository.
75
:param repo: bzr repository
104
:param texts: VersionedFiles to add to
76
105
:param path: Path in the tree
77
106
:param blob: A git blob
107
:return: Inventory entry
79
109
file_id = mapping.generate_file_id(path)
80
text_revision = inv.revision_id
81
repo.texts.add_lines((file_id, text_revision),
82
[(file_id, p[file_id].revision) for p in parent_invs if file_id in p],
83
osutils.split_lines(blob.data))
84
ie = inv.add_path(path, "file", file_id)
85
ie.revision = text_revision
110
# We just have to hope this is indeed utf-8:
111
ie = inv.add_path(path.decode("utf-8"), "file", file_id)
86
112
ie.text_size = len(blob.data)
87
113
ie.text_sha1 = osutils.sha_string(blob.data)
88
114
ie.executable = executable
91
def import_git_tree(repo, mapping, path, tree, inv, parent_invs, lookup_object):
115
# See if this is the same revision as one of the parents unchanged
117
for pinv in parent_invs:
118
if not file_id in pinv:
120
if pinv[file_id].text_sha1 == ie.text_sha1:
121
ie.revision = pinv[file_id].revision
123
parent_keys.append((file_id, pinv[file_id].revision))
124
ie.revision = inv.revision_id
125
assert file_id is not None
126
assert ie.revision is not None
127
texts.add_lines((file_id, ie.revision), parent_keys,
128
osutils.split_lines(blob.data))
129
shagitmap.add_entry(blob.sha().hexdigest(), "blob",
130
(ie.file_id, ie.revision))
134
def import_git_tree(texts, mapping, path, tree, inv, parent_invs, shagitmap,
92
136
"""Import a git tree object into a bzr repository.
94
:param repo: A Bzr repository object
138
:param texts: VersionedFiles object to add to
95
139
:param path: Path in the tree
96
140
:param tree: A git tree object
97
141
:param inv: Inventory object
99
143
file_id = mapping.generate_file_id(path)
100
text_revision = inv.revision_id
101
repo.texts.add_lines((file_id, text_revision),
102
[(file_id, p[file_id].revision) for p in parent_invs if file_id in p],
104
ie = inv.add_path(path, "directory", file_id)
105
ie.revision = text_revision
144
# We just have to hope this is indeed utf-8:
145
ie = inv.add_path(path.decode("utf-8"), "directory", file_id)
148
for pinv in parent_invs:
149
if not file_id in pinv:
152
tree_sha = shagitmap.lookup_tree(path, pinv[file_id].revision)
156
if tree_sha == tree.id:
157
ie.revision = pinv[file_id].revision
159
parent_keys.append((file_id, pinv[file_id].revision))
160
if ie.revision is None:
161
ie.revision = inv.revision_id
162
texts.add_lines((file_id, ie.revision), parent_keys, [])
163
shagitmap.add_entry(tree.id, "tree", (file_id, ie.revision))
106
164
for mode, name, hexsha in tree.entries():
107
165
entry_kind = (mode & 0700000) / 0100000
108
166
basename = name.decode("utf-8")
110
168
child_path = name
112
170
child_path = urlutils.join(path, name)
171
obj = lookup_object(hexsha)
113
172
if entry_kind == 0:
114
tree = lookup_object(hexsha)
115
import_git_tree(repo, mapping, child_path, tree, inv, parent_invs, lookup_object)
173
import_git_tree(texts, mapping, child_path, obj, inv, parent_invs,
174
shagitmap, lookup_object)
116
175
elif entry_kind == 1:
117
blob = lookup_object(hexsha)
118
176
fs_mode = mode & 0777
119
import_git_blob(repo, mapping, child_path, blob, inv, parent_invs, bool(fs_mode & 0111))
177
import_git_blob(texts, mapping, child_path, obj, inv, parent_invs,
178
shagitmap, bool(fs_mode & 0111))
121
180
raise AssertionError("Unknown blob kind, perms=%r." % (mode,))
124
def import_git_objects(repo, mapping, object_iter, pb=None):
184
def import_git_objects(repo, mapping, object_iter, target_git_object_retriever,
125
186
"""Import a set of git objects into a bzr repository.
127
188
:param repo: Bazaar repository
129
190
:param object_iter: Iterator over Git objects.
131
192
# TODO: a more (memory-)efficient implementation of this
133
for i, o in enumerate(object_iter):
135
pb.update("fetching objects", i)
140
198
# Find and convert commit objects
141
for o in objects.itervalues():
201
pb.update("finding revisions to fetch", len(graph), None)
203
assert isinstance(head, str)
204
o = object_iter[head]
142
205
if isinstance(o, Commit):
143
206
rev = mapping.import_commit(o)
144
root_trees[rev.revision_id] = objects[o.tree]
207
if repo.has_revision(rev.revision_id):
209
root_trees[rev.revision_id] = o.tree
145
210
revisions[rev.revision_id] = rev
146
211
graph.append((rev.revision_id, rev.parent_ids))
212
target_git_object_retriever._idmap.add_entry(o.sha().hexdigest(),
213
"commit", (rev.revision_id, o._tree))
214
heads.extend([p for p in o.parents if p not in checked])
216
trace.warning("Unable to import head object %r" % o)
147
218
# Order the revisions
148
219
# Create the inventory objects
149
220
for i, revid in enumerate(topo_sort(graph)):
150
221
if pb is not None:
151
222
pb.update("fetching revisions", i, len(graph))
152
root_tree = root_trees[revid]
223
root_tree = object_iter[root_trees[revid]]
153
224
rev = revisions[revid]
154
225
# We have to do this here, since we have to walk the tree and
155
# we need to make sure to import the blobs / trees with the riht
226
# we need to make sure to import the blobs / trees with the right
156
227
# path; this may involve adding them more than once.
157
228
inv = Inventory()
158
229
inv.revision_id = rev.revision_id
159
230
def lookup_object(sha):
162
return reconstruct_git_object(repo, mapping, sha)
231
if sha in object_iter:
232
return object_iter[sha]
233
return target_git_object_retriever[sha]
163
234
parent_invs = [repo.get_inventory(r) for r in rev.parent_ids]
164
import_git_tree(repo, mapping, "", root_tree, inv, parent_invs, lookup_object)
235
import_git_tree(repo.texts, mapping, "", root_tree, inv, parent_invs,
236
target_git_object_retriever._idmap, lookup_object)
165
237
repo.add_revision(rev.revision_id, rev, inv)
168
def reconstruct_git_commit(repo, rev):
169
raise NotImplementedError(self.reconstruct_git_commit)
172
def reconstruct_git_object(repo, mapping, sha):
174
revid = mapping.revision_id_foreign_to_bzr(sha)
176
rev = repo.get_revision(revid)
177
except NoSuchRevision:
180
return reconstruct_git_commit(rev)
184
raise KeyError("No such object %s" % sha)
187
class InterGitRepository(InterRepository):
189
_matching_repo_format = GitFormat()
238
target_git_object_retriever._idmap.commit()
241
class InterGitNonGitRepository(InterRepository):
242
"""InterRepository that copies revisions from a Git into a non-Git
245
_matching_repo_format = GitRepositoryFormat()
192
248
def _get_repo_format_to_test():
196
252
"""See InterRepository.copy_content."""
197
253
self.fetch(revision_id, pb, find_ghosts=False)
199
def fetch(self, revision_id=None, pb=None, find_ghosts=False,
202
mapping = self.source.get_mapping()
255
def fetch_objects(self, determine_wants, mapping, pb=None):
203
256
def progress(text):
204
pb.note("git: %s", text)
205
def determine_wants(heads):
206
if revision_id is None:
209
ret = [mapping.revision_id_bzr_to_foreign(revision_id)]
210
return [rev for rev in ret if not self.target.has_revision(mapping.revision_id_foreign_to_bzr(rev))]
257
pb.update("git: %s" % text.rstrip("\r\n"), 0, 0)
211
258
graph_walker = BzrFetchGraphWalker(self.target, mapping)
214
261
create_pb = pb = ui.ui_factory.nested_progress_bar()
262
target_git_object_retriever = GitObjectConverter(self.target, mapping)
265
def record_determine_wants(heads):
266
wants = determine_wants(heads)
267
recorded_wants.extend(wants)
216
271
self.target.lock_write()
218
273
self.target.start_write_group()
220
import_git_objects(self.target, mapping,
221
iter(self.source.fetch_objects(determine_wants, graph_walker,
275
objects_iter = self.source.fetch_objects(
276
record_determine_wants,
278
target_git_object_retriever.__getitem__,
280
import_git_objects(self.target, mapping, objects_iter,
281
target_git_object_retriever, recorded_wants, pb)
224
283
self.target.commit_write_group()
229
288
create_pb.finished()
290
def fetch(self, revision_id=None, pb=None, find_ghosts=False, mapping=None,
292
self.fetch_refs(revision_id=revision_id, pb=pb, find_ghosts=find_ghosts,
293
mapping=mapping, fetch_spec=fetch_spec)
295
def fetch_refs(self, revision_id=None, pb=None, find_ghosts=False,
296
mapping=None, fetch_spec=None):
298
mapping = self.source.get_mapping()
299
if revision_id is not None:
300
interesting_heads = [revision_id]
301
elif fetch_spec is not None:
302
interesting_heads = fetch_spec.heads
304
interesting_heads = None
306
def determine_wants(refs):
308
if interesting_heads is None:
309
ret = [sha for (ref, sha) in refs.iteritems() if not ref.endswith("^{}")]
311
ret = [mapping.revision_id_bzr_to_foreign(revid)[0] for revid in interesting_heads]
312
return [rev for rev in ret if not self.target.has_revision(mapping.revision_id_foreign_to_bzr(rev))]
313
self.fetch_objects(determine_wants, mapping, pb)
232
317
def is_compatible(source, target):
233
318
"""Be compatible with GitRepository."""
234
319
# FIXME: Also check target uses VersionedFile
235
320
return (isinstance(source, GitRepository) and
236
target.supports_rich_root())
321
target.supports_rich_root() and
322
not isinstance(target, GitRepository))
325
class InterGitRepository(InterRepository):
326
"""InterRepository that copies between Git repositories."""
328
_matching_repo_format = GitRepositoryFormat()
331
def _get_repo_format_to_test():
334
def copy_content(self, revision_id=None, pb=None):
335
"""See InterRepository.copy_content."""
336
self.fetch(revision_id, pb, find_ghosts=False)
338
def fetch(self, revision_id=None, pb=None, find_ghosts=False,
339
mapping=None, fetch_spec=None):
341
mapping = self.source.get_mapping()
343
trace.info("git: %s", text)
345
if revision_id is not None:
346
args = [mapping.revision_id_bzr_to_foreign(revision_id)[0]]
347
elif fetch_spec is not None:
348
args = [mapping.revision_id_bzr_to_foreign(revid)[0] for revid in fetch_spec.heads]
349
if fetch_spec is None and revision_id is None:
350
determine_wants = r.object_store.determine_wants_all
352
determine_wants = lambda x: [y for y in args if not y in r.object_store]
354
graphwalker = SimpleFetchGraphWalker(r.heads().values(), r.get_parents)
355
f, commit = r.object_store.add_pack()
357
self.source._git.fetch_pack(path, determine_wants, graphwalker, f.write, progress)
365
def is_compatible(source, target):
366
"""Be compatible with GitRepository."""
367
return (isinstance(source, GitRepository) and
368
isinstance(target, GitRepository))