14
14
# along with this program; if not, write to the Free Software
15
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17
from cStringIO import (
21
from dulwich.client import (
22
SimpleFetchGraphWalker,
24
from dulwich.objects import (
35
from bzrlib.errors import (
39
from bzrlib.inventory import (
45
from bzrlib.lru_cache import (
48
from bzrlib.repository import (
51
from bzrlib.revision import (
54
from bzrlib.tsort import (
58
from bzrlib.plugins.git.converter import (
17
from bzrlib import osutils, ui, urlutils
18
from bzrlib.errors import InvalidRevisionId
19
from bzrlib.inventory import Inventory
20
from bzrlib.repository import InterRepository
21
from bzrlib.trace import info
22
from bzrlib.tsort import topo_sort
24
from bzrlib.plugins.git import git
61
25
from bzrlib.plugins.git.repository import (
66
from bzrlib.plugins.git.remote import (
30
from bzrlib.plugins.git.remote import RemoteGitRepository
32
from dulwich.objects import Commit
34
from cStringIO import StringIO
71
37
class BzrFetchGraphWalker(object):
72
"""GraphWalker implementation that uses a Bazaar repository."""
74
39
def __init__(self, repository, mapping):
75
40
self.repository = repository
101
63
self.heads.update([p for p in ps if not p in self.done])
103
65
self.done.add(ret)
104
return self.mapping.revision_id_bzr_to_foreign(ret)[0]
66
return self.mapping.revision_id_bzr_to_foreign(ret)
105
67
except InvalidRevisionId:
110
def import_git_blob(texts, mapping, path, blob, base_inv, parent_id,
111
revision_id, parent_invs, shagitmap, executable):
72
def import_git_blob(repo, mapping, path, blob, inv, parent_invs, executable):
112
73
"""Import a git blob object into a bzr repository.
114
:param texts: VersionedFiles to add to
75
:param repo: bzr repository
115
76
:param path: Path in the tree
116
77
:param blob: A git blob
117
:return: Inventory delta for this file
119
79
file_id = mapping.generate_file_id(path)
120
# We just have to hope this is indeed utf-8:
121
ie = InventoryFile(file_id, urlutils.basename(path).decode("utf-8"),
80
text_revision = inv.revision_id
81
repo.texts.add_lines((file_id, text_revision),
82
[(file_id, p[file_id].revision) for p in parent_invs if file_id in p],
83
osutils.split_lines(blob.data))
84
ie = inv.add_path(path, "file", file_id)
85
ie.revision = text_revision
123
86
ie.text_size = len(blob.data)
124
87
ie.text_sha1 = osutils.sha_string(blob.data)
125
88
ie.executable = executable
126
# If there were no changes compared to the base inventory, there's no need
128
if (file_id in base_inv and
129
base_inv[file_id].parent_id == ie.parent_id and
130
base_inv[file_id].text_sha1 == ie.text_sha1 and
131
base_inv[file_id].executable == ie.executable):
133
# Check what revision we should store
135
for pinv in parent_invs:
136
if not file_id in pinv:
138
if pinv[file_id].text_sha1 == ie.text_sha1:
139
# found a revision in one of the parents to use
140
ie.revision = pinv[file_id].revision
142
parent_keys.append((file_id, pinv[file_id].revision))
143
if ie.revision is None:
144
# Need to store a new revision
145
ie.revision = revision_id
146
assert file_id is not None
147
assert ie.revision is not None
148
texts.add_lines((file_id, ie.revision), parent_keys,
149
osutils.split_lines(blob.data))
150
shagitmap.add_entry(blob.sha().hexdigest(), "blob",
151
(ie.file_id, ie.revision))
152
if file_id in base_inv:
153
old_path = base_inv.id2path(file_id)
156
return [(old_path, path, file_id, ie)]
159
def import_git_tree(texts, mapping, path, tree, base_inv, parent_id,
160
revision_id, parent_invs, shagitmap, lookup_object):
91
def import_git_tree(repo, mapping, path, tree, inv, parent_invs, lookup_object):
161
92
"""Import a git tree object into a bzr repository.
163
:param texts: VersionedFiles object to add to
94
:param repo: A Bzr repository object
164
95
:param path: Path in the tree
165
96
:param tree: A git tree object
166
:param base_inv: Base inventory against which to return inventory delta
167
:return: Inventory delta for this subtree
97
:param inv: Inventory object
170
99
file_id = mapping.generate_file_id(path)
171
# We just have to hope this is indeed utf-8:
172
ie = InventoryDirectory(file_id, urlutils.basename(path.decode("utf-8")),
174
if not file_id in base_inv:
175
# Newly appeared here
176
ie.revision = revision_id
177
texts.add_lines((file_id, ie.revision), [], [])
178
ret.append((None, path, file_id, ie))
180
# See if this has changed at all
182
base_sha = shagitmap.lookup_tree(path, base_inv.revision_id)
186
if base_sha == tree.id:
187
# If nothing has changed since the base revision, we're done
189
# Remember for next time
190
existing_children = set()
191
shagitmap.add_entry(tree.id, "tree", (file_id, revision_id))
100
text_revision = inv.revision_id
101
repo.texts.add_lines((file_id, text_revision),
102
[(file_id, p[file_id].revision) for p in parent_invs if file_id in p],
104
ie = inv.add_path(path, "directory", file_id)
105
ie.revision = text_revision
192
106
for mode, name, hexsha in tree.entries():
193
107
entry_kind = (mode & 0700000) / 0100000
194
108
basename = name.decode("utf-8")
195
existing_children.add(basename)
197
110
child_path = name
199
112
child_path = urlutils.join(path, name)
200
obj = lookup_object(hexsha)
201
113
if entry_kind == 0:
202
ret.extend(import_git_tree(texts, mapping, child_path, obj, base_inv,
203
file_id, revision_id, parent_invs, shagitmap, lookup_object))
114
tree = lookup_object(hexsha)
115
import_git_tree(repo, mapping, child_path, tree, inv, parent_invs, lookup_object)
204
116
elif entry_kind == 1:
117
blob = lookup_object(hexsha)
205
118
fs_mode = mode & 0777
206
ret.extend(import_git_blob(texts, mapping, child_path, obj, base_inv,
207
file_id, revision_id, parent_invs, shagitmap,
208
bool(fs_mode & 0111)))
119
import_git_blob(repo, mapping, child_path, blob, inv, parent_invs, bool(fs_mode & 0111))
210
121
raise AssertionError("Unknown blob kind, perms=%r." % (mode,))
211
# Remove any children that have disappeared
212
if file_id in base_inv:
213
deletable = [v for k,v in base_inv[file_id].children.iteritems() if k not in existing_children]
216
ret.append((base_inv.id2path(ie.file_id), None, ie.file_id, None))
217
if ie.kind == "directory":
218
deletable.extend(ie.children.values())
222
def import_git_objects(repo, mapping, object_iter, target_git_object_retriever,
124
def import_git_objects(repo, mapping, object_iter, pb=None):
224
125
"""Import a set of git objects into a bzr repository.
226
127
:param repo: Bazaar repository
228
129
:param object_iter: Iterator over Git objects.
230
131
# TODO: a more (memory-)efficient implementation of this
133
for i, o in enumerate(object_iter):
135
pb.update("fetching objects", i)
236
parent_invs_cache = LRUCache(50)
237
140
# Find and convert commit objects
240
pb.update("finding revisions to fetch", len(graph), None)
242
assert isinstance(head, str)
243
o = object_iter[head]
141
for o in objects.itervalues():
244
142
if isinstance(o, Commit):
245
143
rev = mapping.import_commit(o)
246
if repo.has_revision(rev.revision_id):
248
root_trees[rev.revision_id] = o.tree
144
root_trees[rev.revision_id] = objects[o.tree]
249
145
revisions[rev.revision_id] = rev
250
146
graph.append((rev.revision_id, rev.parent_ids))
251
target_git_object_retriever._idmap.add_entry(o.sha().hexdigest(),
252
"commit", (rev.revision_id, o._tree))
253
heads.extend([p for p in o.parents if p not in checked])
254
elif isinstance(o, Tag):
255
heads.append(o.object[1])
257
trace.warning("Unable to import head object %r" % o)
259
147
# Order the revisions
260
148
# Create the inventory objects
261
149
for i, revid in enumerate(topo_sort(graph)):
262
150
if pb is not None:
263
151
pb.update("fetching revisions", i, len(graph))
264
root_tree = object_iter[root_trees[revid]]
152
root_tree = root_trees[revid]
265
153
rev = revisions[revid]
266
154
# We have to do this here, since we have to walk the tree and
267
# we need to make sure to import the blobs / trees with the right
155
# we need to make sure to import the blobs / trees with the riht
268
156
# path; this may involve adding them more than once.
158
inv.revision_id = rev.revision_id
269
159
def lookup_object(sha):
271
return object_iter[sha]
273
return target_git_object_retriever[sha]
275
for parent_id in rev.parent_ids:
277
parent_invs.append(parent_invs_cache[parent_id])
279
parent_inv = repo.get_inventory(parent_id)
280
parent_invs.append(parent_inv)
281
parent_invs_cache[parent_id] = parent_inv
282
if parent_invs == []:
283
base_inv = Inventory(root_id=None)
285
base_inv = parent_invs[0]
286
inv_delta = import_git_tree(repo.texts, mapping, "", root_tree,
287
base_inv, None, revid, parent_invs,
288
target_git_object_retriever._idmap, lookup_object)
290
basis_id = rev.parent_ids[0]
292
basis_id = NULL_REVISION
293
rev.inventory_sha1, inv = repo.add_inventory_by_delta(basis_id,
294
inv_delta, rev.revision_id, rev.parent_ids)
295
parent_invs_cache[rev.revision_id] = inv
296
repo.add_revision(rev.revision_id, rev)
297
target_git_object_retriever._idmap.commit()
300
class InterGitNonGitRepository(InterRepository):
301
"""InterRepository that copies revisions from a Git into a non-Git
304
_matching_repo_format = GitRepositoryFormat()
162
return reconstruct_git_object(repo, mapping, sha)
163
parent_invs = [repo.get_inventory(r) for r in rev.parent_ids]
164
import_git_tree(repo, mapping, "", root_tree, inv, parent_invs, lookup_object)
165
repo.add_revision(rev.revision_id, rev, inv)
168
def reconstruct_git_commit(repo, rev):
169
raise NotImplementedError(self.reconstruct_git_commit)
172
def reconstruct_git_object(repo, mapping, sha):
174
revid = mapping.revision_id_foreign_to_bzr(sha)
176
rev = repo.get_revision(revid)
177
except NoSuchRevision:
180
return reconstruct_git_commit(rev)
184
raise KeyError("No such object %s" % sha)
187
class InterGitRepository(InterRepository):
189
_matching_repo_format = GitFormat()
307
192
def _get_repo_format_to_test():
311
196
"""See InterRepository.copy_content."""
312
197
self.fetch(revision_id, pb, find_ghosts=False)
314
def fetch_objects(self, determine_wants, mapping, pb=None):
199
def fetch(self, revision_id=None, pb=None, find_ghosts=False,
202
mapping = self.source.get_mapping()
315
203
def progress(text):
316
pb.update("git: %s" % text.rstrip("\r\n"), 0, 0)
204
pb.note("git: %s", text)
205
def determine_wants(heads):
206
if revision_id is None:
209
ret = [mapping.revision_id_bzr_to_foreign(revision_id)]
210
return [rev for rev in ret if not self.target.has_revision(mapping.revision_id_foreign_to_bzr(rev))]
317
211
graph_walker = BzrFetchGraphWalker(self.target, mapping)
320
214
create_pb = pb = ui.ui_factory.nested_progress_bar()
321
target_git_object_retriever = GitObjectConverter(self.target, mapping)
324
def record_determine_wants(heads):
325
wants = determine_wants(heads)
326
recorded_wants.extend(wants)
330
216
self.target.lock_write()
332
218
self.target.start_write_group()
334
objects_iter = self.source.fetch_objects(
335
record_determine_wants,
337
target_git_object_retriever.__getitem__,
339
import_git_objects(self.target, mapping, objects_iter,
340
target_git_object_retriever, recorded_wants, pb)
220
import_git_objects(self.target, mapping,
221
iter(self.source.fetch_objects(determine_wants, graph_walker,
342
224
self.target.commit_write_group()
347
229
create_pb.finished()
349
def fetch(self, revision_id=None, pb=None, find_ghosts=False, mapping=None,
351
self.fetch_refs(revision_id=revision_id, pb=pb, find_ghosts=find_ghosts,
352
mapping=mapping, fetch_spec=fetch_spec)
354
def fetch_refs(self, revision_id=None, pb=None, find_ghosts=False,
355
mapping=None, fetch_spec=None):
357
mapping = self.source.get_mapping()
358
if revision_id is not None:
359
interesting_heads = [revision_id]
360
elif fetch_spec is not None:
361
interesting_heads = fetch_spec.heads
363
interesting_heads = None
365
def determine_wants(refs):
367
if interesting_heads is None:
368
ret = [sha for (ref, sha) in refs.iteritems() if not ref.endswith("^{}")]
370
ret = [mapping.revision_id_bzr_to_foreign(revid)[0] for revid in interesting_heads]
371
return [rev for rev in ret if not self.target.has_revision(mapping.revision_id_foreign_to_bzr(rev))]
372
self.fetch_objects(determine_wants, mapping, pb)
376
232
def is_compatible(source, target):
377
233
"""Be compatible with GitRepository."""
378
234
# FIXME: Also check target uses VersionedFile
379
235
return (isinstance(source, GitRepository) and
380
target.supports_rich_root() and
381
not isinstance(target, GitRepository))
384
class InterGitRepository(InterRepository):
385
"""InterRepository that copies between Git repositories."""
387
_matching_repo_format = GitRepositoryFormat()
390
def _get_repo_format_to_test():
393
def copy_content(self, revision_id=None, pb=None):
394
"""See InterRepository.copy_content."""
395
self.fetch(revision_id, pb, find_ghosts=False)
397
def fetch(self, revision_id=None, pb=None, find_ghosts=False,
398
mapping=None, fetch_spec=None):
400
mapping = self.source.get_mapping()
402
trace.info("git: %s", text)
404
if revision_id is not None:
405
args = [mapping.revision_id_bzr_to_foreign(revision_id)[0]]
406
elif fetch_spec is not None:
407
args = [mapping.revision_id_bzr_to_foreign(revid)[0] for revid in fetch_spec.heads]
408
if fetch_spec is None and revision_id is None:
409
determine_wants = r.object_store.determine_wants_all
411
determine_wants = lambda x: [y for y in args if not y in r.object_store]
413
graphwalker = SimpleFetchGraphWalker(r.heads().values(), r.get_parents)
414
f, commit = r.object_store.add_pack()
416
self.source._git.fetch_pack(path, determine_wants, graphwalker, f.write, progress)
424
def is_compatible(source, target):
425
"""Be compatible with GitRepository."""
426
return (isinstance(source, GitRepository) and
427
isinstance(target, GitRepository))
236
target.supports_rich_root())