1
# Copyright (C) 2007 Canonical Ltd
2
# Copyright (C) 2008-2009 Jelmer Vernooij <jelmer@samba.org>
3
# Copyright (C) 2008 John Carr
1
# Copyright (C) 2007-2008 Canonical Ltd
5
3
# This program is free software; you can redistribute it and/or modify
6
4
# it under the terms of the GNU General Public License as published by
19
17
"""Converters, etc for going between Bazaar and Git ids."""
26
from bzrlib.inventory import (
19
from bzrlib import errors, foreign
20
from bzrlib.inventory import ROOT_ID
29
21
from bzrlib.foreign import (
34
from bzrlib.plugins.git.foreign import (
35
escape_commit_message,
39
27
def escape_file_id(file_id):
40
28
return file_id.replace('_', '__').replace(' ', '_s')
67
55
return bzr_rev_id[len(cls.revid_prefix)+1:], cls()
69
57
def generate_file_id(self, path):
70
# Git paths are just bytestrings
71
# We must just hope they are valid UTF-8..
72
assert isinstance(path, str)
75
return escape_file_id(path)
77
def parse_file_id(self, file_id):
78
if file_id == ROOT_ID:
80
return unescape_file_id(file_id)
60
return escape_file_id(path.encode('utf-8'))
82
62
def import_commit(self, commit):
83
63
"""Convert a git commit to a bzr revision.
88
68
raise AssertionError("Commit object can't be None")
89
69
rev = ForeignRevision(commit.id, self, self.revision_id_foreign_to_bzr(commit.id))
90
70
rev.parent_ids = tuple([self.revision_id_foreign_to_bzr(p) for p in commit.parents])
91
rev.message = escape_commit_message(commit.message.decode("utf-8", "replace"))
92
rev.committer = escape_commit_message(str(commit.committer).decode("utf-8", "replace"))
71
rev.message = commit.message.decode("utf-8", "replace")
72
rev.committer = str(commit.committer).decode("utf-8", "replace")
93
73
if commit.committer != commit.author:
94
rev.properties['author'] = escape_commit_message(str(commit.author).decode("utf-8", "replace"))
74
rev.properties['author'] = str(commit.author).decode("utf-8", "replace")
95
75
rev.timestamp = commit.commit_time
79
def export_commit(self, rev, tree_sha):
80
"""Turn a Bazaar revision in to a Git commit
82
:param tree_sha: HACK parameter (until we can retrieve this from the mapping)
83
:return dulwich.objects.Commit represent the revision:
85
from dulwich.objects import Commit
87
commit._tree = tree_sha
88
for p in rev.parent_ids:
89
commit._parents.append(self.revision_id_bzr_to_foreign(p))
90
commit._message = rev.message
91
commit._committer = rev.committer
92
if 'author' in rev.properties:
93
commit._author = rev.properties['author']
95
commit._author = rev.committer
96
commit._commit_time = long(rev.timestamp)
100
101
class BzrGitMappingv1(BzrGitMapping):
101
102
revid_prefix = 'git-v1'
140
141
foreign_git = ForeignGit()
141
142
default_mapping = BzrGitMappingv1()
144
def text_to_blob(text):
145
from dulwich.objects import Blob
151
def inventory_to_tree_and_blobs(repo, mapping, revision_id):
152
from dulwich.objects import Tree
153
from bzrlib.inventory import InventoryDirectory, InventoryFile
159
inv = repo.get_inventory(revision_id)
161
# stack contains the set of trees that we haven't
162
# finished constructing
163
for path, entry in inv.iter_entries():
164
while stack and not path.startswith(cur):
168
t = (stat.S_IFDIR, urlutils.basename(cur).encode('UTF-8'), sha)
169
cur, tree = stack.pop()
172
if type(entry) == InventoryDirectory:
173
stack.append((cur, tree))
177
if type(entry) == InventoryFile:
178
#FIXME: We can make potentially make this Lazy to avoid shaing lots of stuff
179
# and having all these objects in memory at once
180
text = repo.texts.get_record_stream([(entry.file_id, entry.revision)], 'unordered', True).next().get_bytes_as('fulltext')
181
blob = text_to_blob(text)
183
yield sha, blob, path
185
name = urlutils.basename(path).encode("utf-8")
186
mode = stat.S_IFREG | 0644
189
tree.add(mode, name, sha)
191
while len(stack) > 1:
195
t = (stat.S_IFDIR, urlutils.basename(cur).encode('UTF-8'), sha)
196
cur, tree = stack.pop()
200
yield tree.id, tree, cur
203
def revision_to_commit(rev, tree_sha, parent_lookup):
204
"""Turn a Bazaar revision in to a Git commit
206
:param tree_sha: Tree sha for the commit
207
:param parent_lookup: Function for looking up the GIT sha equiv of a bzr revision
208
:return dulwich.objects.Commit represent the revision:
210
from dulwich.objects import Commit
212
commit._tree = tree_sha
213
for p in rev.parent_ids:
214
git_p = parent_lookup(p)
215
if git_p is not None:
216
assert len(git_p) == 40, "unexpected length for %r" % git_p
217
commit._parents.append(git_p)
218
commit._message = rev.message.encode("utf-8")
219
commit._committer = rev.committer.encode("utf-8")
220
commit._author = rev.get_apparent_authors()[0].encode("utf-8")
221
commit._commit_time = long(rev.timestamp)