14
14
# along with this program; if not, write to the Free Software
15
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17
from bzrlib import osutils, ui, urlutils
18
from bzrlib.errors import InvalidRevisionId
19
from bzrlib.inventory import Inventory
20
from bzrlib.repository import InterRepository
21
from bzrlib.trace import info
22
from bzrlib.tsort import topo_sort
24
from bzrlib.plugins.git import git
17
from cStringIO import (
21
from dulwich.client import (
22
SimpleFetchGraphWalker,
24
from dulwich.objects import (
35
from bzrlib.errors import (
39
from bzrlib.inventory import (
45
from bzrlib.lru_cache import (
48
from bzrlib.repository import (
51
from bzrlib.revision import (
54
from bzrlib.tsort import (
58
from bzrlib.plugins.git.converter import (
25
61
from bzrlib.plugins.git.repository import (
30
from bzrlib.plugins.git.remote import RemoteGitRepository
32
from dulwich.objects import Commit
34
from cStringIO import StringIO
66
from bzrlib.plugins.git.remote import (
37
71
class BzrFetchGraphWalker(object):
72
"""GraphWalker implementation that uses a Bazaar repository."""
39
74
def __init__(self, repository, mapping):
40
75
self.repository = repository
63
101
self.heads.update([p for p in ps if not p in self.done])
65
103
self.done.add(ret)
66
return self.mapping.revision_id_bzr_to_foreign(ret)
104
return self.mapping.revision_id_bzr_to_foreign(ret)[0]
67
105
except InvalidRevisionId:
72
def import_git_blob(repo, mapping, path, blob, inv, parent_invs, executable):
110
def import_git_blob(texts, mapping, path, blob, base_inv, parent_id,
111
revision_id, parent_invs, shagitmap, executable):
73
112
"""Import a git blob object into a bzr repository.
75
:param repo: bzr repository
114
:param texts: VersionedFiles to add to
76
115
:param path: Path in the tree
77
116
:param blob: A git blob
117
:return: Inventory delta for this file
79
119
file_id = mapping.generate_file_id(path)
80
text_revision = inv.revision_id
81
repo.texts.add_lines((file_id, text_revision),
82
[(file_id, p[file_id].revision) for p in parent_invs if file_id in p],
83
osutils.split_lines(blob.data))
84
ie = inv.add_path(path, "file", file_id)
85
ie.revision = text_revision
120
# We just have to hope this is indeed utf-8:
121
ie = InventoryFile(file_id, urlutils.basename(path).decode("utf-8"),
86
123
ie.text_size = len(blob.data)
87
124
ie.text_sha1 = osutils.sha_string(blob.data)
88
125
ie.executable = executable
91
def import_git_tree(repo, mapping, path, tree, inv, parent_invs, lookup_object):
126
# If there were no changes compared to the base inventory, there's no need
128
if (file_id in base_inv and
129
base_inv[file_id].parent_id == ie.parent_id and
130
base_inv[file_id].text_sha1 == ie.text_sha1 and
131
base_inv[file_id].executable == ie.executable):
133
# Check what revision we should store
135
for pinv in parent_invs:
136
if not file_id in pinv:
138
if pinv[file_id].text_sha1 == ie.text_sha1:
139
# found a revision in one of the parents to use
140
ie.revision = pinv[file_id].revision
142
parent_keys.append((file_id, pinv[file_id].revision))
143
if ie.revision is None:
144
# Need to store a new revision
145
ie.revision = revision_id
146
assert file_id is not None
147
assert ie.revision is not None
148
texts.add_lines((file_id, ie.revision), parent_keys,
149
osutils.split_lines(blob.data))
150
shagitmap.add_entry(blob.sha().hexdigest(), "blob",
151
(ie.file_id, ie.revision))
152
if file_id in base_inv:
153
old_path = base_inv.id2path(file_id)
156
return [(old_path, path, file_id, ie)]
159
def import_git_tree(texts, mapping, path, tree, base_inv, parent_id,
160
revision_id, parent_invs, shagitmap, lookup_object):
92
161
"""Import a git tree object into a bzr repository.
94
:param repo: A Bzr repository object
163
:param texts: VersionedFiles object to add to
95
164
:param path: Path in the tree
96
165
:param tree: A git tree object
97
:param inv: Inventory object
166
:param base_inv: Base inventory against which to return inventory delta
167
:return: Inventory delta for this subtree
99
170
file_id = mapping.generate_file_id(path)
100
text_revision = inv.revision_id
101
repo.texts.add_lines((file_id, text_revision),
102
[(file_id, p[file_id].revision) for p in parent_invs if file_id in p],
104
ie = inv.add_path(path, "directory", file_id)
105
ie.revision = text_revision
171
# We just have to hope this is indeed utf-8:
172
ie = InventoryDirectory(file_id, urlutils.basename(path.decode("utf-8")),
174
if not file_id in base_inv:
175
# Newly appeared here
176
ie.revision = revision_id
177
texts.add_lines((file_id, ie.revision), [], [])
178
ret.append((None, path, file_id, ie))
180
# See if this has changed at all
182
base_sha = shagitmap.lookup_tree(path, base_inv.revision_id)
186
if base_sha == tree.id:
187
# If nothing has changed since the base revision, we're done
189
# Remember for next time
190
existing_children = set()
191
shagitmap.add_entry(tree.id, "tree", (file_id, revision_id))
106
192
for mode, name, hexsha in tree.entries():
107
193
entry_kind = (mode & 0700000) / 0100000
108
194
basename = name.decode("utf-8")
195
existing_children.add(basename)
110
197
child_path = name
112
199
child_path = urlutils.join(path, name)
200
obj = lookup_object(hexsha)
113
201
if entry_kind == 0:
114
tree = lookup_object(hexsha)
115
import_git_tree(repo, mapping, child_path, tree, inv, parent_invs, lookup_object)
202
ret.extend(import_git_tree(texts, mapping, child_path, obj, base_inv,
203
file_id, revision_id, parent_invs, shagitmap, lookup_object))
116
204
elif entry_kind == 1:
117
blob = lookup_object(hexsha)
118
205
fs_mode = mode & 0777
119
import_git_blob(repo, mapping, child_path, blob, inv, parent_invs, bool(fs_mode & 0111))
206
ret.extend(import_git_blob(texts, mapping, child_path, obj, base_inv,
207
file_id, revision_id, parent_invs, shagitmap,
208
bool(fs_mode & 0111)))
121
210
raise AssertionError("Unknown blob kind, perms=%r." % (mode,))
124
def import_git_objects(repo, mapping, object_iter, pb=None):
211
# Remove any children that have disappeared
212
if file_id in base_inv:
213
deletable = [v for k,v in base_inv[file_id].children.iteritems() if k not in existing_children]
216
ret.append((base_inv.id2path(ie.file_id), None, ie.file_id, None))
217
if ie.kind == "directory":
218
deletable.extend(ie.children.values())
222
def import_git_objects(repo, mapping, object_iter, target_git_object_retriever,
125
224
"""Import a set of git objects into a bzr repository.
127
226
:param repo: Bazaar repository
129
228
:param object_iter: Iterator over Git objects.
131
230
# TODO: a more (memory-)efficient implementation of this
133
for i, o in enumerate(object_iter):
135
pb.update("fetching objects", i)
236
parent_invs_cache = LRUCache(50)
140
237
# Find and convert commit objects
141
for o in objects.itervalues():
240
pb.update("finding revisions to fetch", len(graph), None)
242
assert isinstance(head, str)
243
o = object_iter[head]
142
244
if isinstance(o, Commit):
143
245
rev = mapping.import_commit(o)
144
root_trees[rev.revision_id] = objects[o.tree]
246
if repo.has_revision(rev.revision_id):
248
root_trees[rev.revision_id] = o.tree
145
249
revisions[rev.revision_id] = rev
146
250
graph.append((rev.revision_id, rev.parent_ids))
251
target_git_object_retriever._idmap.add_entry(o.sha().hexdigest(),
252
"commit", (rev.revision_id, o._tree))
253
heads.extend([p for p in o.parents if p not in checked])
254
elif isinstance(o, Tag):
255
heads.append(o.object[1])
257
trace.warning("Unable to import head object %r" % o)
147
259
# Order the revisions
148
260
# Create the inventory objects
149
261
for i, revid in enumerate(topo_sort(graph)):
150
262
if pb is not None:
151
263
pb.update("fetching revisions", i, len(graph))
152
root_tree = root_trees[revid]
264
root_tree = object_iter[root_trees[revid]]
153
265
rev = revisions[revid]
154
266
# We have to do this here, since we have to walk the tree and
155
# we need to make sure to import the blobs / trees with the riht
267
# we need to make sure to import the blobs / trees with the right
156
268
# path; this may involve adding them more than once.
158
inv.revision_id = rev.revision_id
159
269
def lookup_object(sha):
162
return reconstruct_git_object(repo, mapping, sha)
163
parent_invs = [repo.get_inventory(r) for r in rev.parent_ids]
164
import_git_tree(repo, mapping, "", root_tree, inv, parent_invs, lookup_object)
165
repo.add_revision(rev.revision_id, rev, inv)
168
def reconstruct_git_commit(repo, rev):
169
raise NotImplementedError(self.reconstruct_git_commit)
172
def reconstruct_git_object(repo, mapping, sha):
174
revid = mapping.revision_id_foreign_to_bzr(sha)
176
rev = repo.get_revision(revid)
177
except NoSuchRevision:
180
return reconstruct_git_commit(rev)
184
raise KeyError("No such object %s" % sha)
187
class InterGitRepository(InterRepository):
189
_matching_repo_format = GitFormat()
271
return object_iter[sha]
273
return target_git_object_retriever[sha]
275
for parent_id in rev.parent_ids:
277
parent_invs.append(parent_invs_cache[parent_id])
279
parent_inv = repo.get_inventory(parent_id)
280
parent_invs.append(parent_inv)
281
parent_invs_cache[parent_id] = parent_inv
282
if parent_invs == []:
283
base_inv = Inventory(root_id=None)
285
base_inv = parent_invs[0]
286
inv_delta = import_git_tree(repo.texts, mapping, "", root_tree,
287
base_inv, None, revid, parent_invs,
288
target_git_object_retriever._idmap, lookup_object)
290
basis_id = rev.parent_ids[0]
292
basis_id = NULL_REVISION
293
rev.inventory_sha1, inv = repo.add_inventory_by_delta(basis_id,
294
inv_delta, rev.revision_id, rev.parent_ids)
295
parent_invs_cache[rev.revision_id] = inv
296
repo.add_revision(rev.revision_id, rev)
297
target_git_object_retriever._idmap.commit()
300
class InterGitNonGitRepository(InterRepository):
301
"""InterRepository that copies revisions from a Git into a non-Git
304
_matching_repo_format = GitRepositoryFormat()
192
307
def _get_repo_format_to_test():
196
311
"""See InterRepository.copy_content."""
197
312
self.fetch(revision_id, pb, find_ghosts=False)
199
def fetch(self, revision_id=None, pb=None, find_ghosts=False,
202
mapping = self.source.get_mapping()
314
def fetch_objects(self, determine_wants, mapping, pb=None):
203
315
def progress(text):
204
pb.note("git: %s", text)
205
def determine_wants(heads):
206
if revision_id is None:
209
ret = [mapping.revision_id_bzr_to_foreign(revision_id)]
210
return [rev for rev in ret if not self.target.has_revision(mapping.revision_id_foreign_to_bzr(rev))]
316
pb.update("git: %s" % text.rstrip("\r\n"), 0, 0)
211
317
graph_walker = BzrFetchGraphWalker(self.target, mapping)
214
320
create_pb = pb = ui.ui_factory.nested_progress_bar()
321
target_git_object_retriever = GitObjectConverter(self.target, mapping)
324
def record_determine_wants(heads):
325
wants = determine_wants(heads)
326
recorded_wants.extend(wants)
216
330
self.target.lock_write()
218
332
self.target.start_write_group()
220
import_git_objects(self.target, mapping,
221
iter(self.source.fetch_objects(determine_wants, graph_walker,
334
objects_iter = self.source.fetch_objects(
335
record_determine_wants,
337
target_git_object_retriever.__getitem__,
339
import_git_objects(self.target, mapping, objects_iter,
340
target_git_object_retriever, recorded_wants, pb)
224
342
self.target.commit_write_group()
229
347
create_pb.finished()
349
def fetch(self, revision_id=None, pb=None, find_ghosts=False, mapping=None,
351
self.fetch_refs(revision_id=revision_id, pb=pb, find_ghosts=find_ghosts,
352
mapping=mapping, fetch_spec=fetch_spec)
354
def fetch_refs(self, revision_id=None, pb=None, find_ghosts=False,
355
mapping=None, fetch_spec=None):
357
mapping = self.source.get_mapping()
358
if revision_id is not None:
359
interesting_heads = [revision_id]
360
elif fetch_spec is not None:
361
interesting_heads = fetch_spec.heads
363
interesting_heads = None
365
def determine_wants(refs):
367
if interesting_heads is None:
368
ret = [sha for (ref, sha) in refs.iteritems() if not ref.endswith("^{}")]
370
ret = [mapping.revision_id_bzr_to_foreign(revid)[0] for revid in interesting_heads]
371
return [rev for rev in ret if not self.target.has_revision(mapping.revision_id_foreign_to_bzr(rev))]
372
self.fetch_objects(determine_wants, mapping, pb)
232
376
def is_compatible(source, target):
233
377
"""Be compatible with GitRepository."""
234
378
# FIXME: Also check target uses VersionedFile
235
379
return (isinstance(source, GitRepository) and
236
target.supports_rich_root())
380
target.supports_rich_root() and
381
not isinstance(target, GitRepository))
384
class InterGitRepository(InterRepository):
385
"""InterRepository that copies between Git repositories."""
387
_matching_repo_format = GitRepositoryFormat()
390
def _get_repo_format_to_test():
393
def copy_content(self, revision_id=None, pb=None):
394
"""See InterRepository.copy_content."""
395
self.fetch(revision_id, pb, find_ghosts=False)
397
def fetch(self, revision_id=None, pb=None, find_ghosts=False,
398
mapping=None, fetch_spec=None):
400
mapping = self.source.get_mapping()
402
trace.info("git: %s", text)
404
if revision_id is not None:
405
args = [mapping.revision_id_bzr_to_foreign(revision_id)[0]]
406
elif fetch_spec is not None:
407
args = [mapping.revision_id_bzr_to_foreign(revid)[0] for revid in fetch_spec.heads]
408
if fetch_spec is None and revision_id is None:
409
determine_wants = r.object_store.determine_wants_all
411
determine_wants = lambda x: [y for y in args if not y in r.object_store]
413
graphwalker = SimpleFetchGraphWalker(r.heads().values(), r.get_parents)
414
f, commit = r.object_store.add_pack()
416
self.source._git.fetch_pack(path, determine_wants, graphwalker, f.write, progress)
424
def is_compatible(source, target):
425
"""Be compatible with GitRepository."""
426
return (isinstance(source, GitRepository) and
427
isinstance(target, GitRepository))