41
50
self.mapping = self.repository.get_mapping()
43
52
self.mapping = mapping
44
self._idmap = GitShaMap(self.repository._transport)
46
def _update_sha_map(self):
47
all_revids = self.repository.all_revision_ids()
53
self._idmap = SqliteGitShaMap.from_repository(repository)
55
def iter_shas(self, shas):
56
return ObjectStoreIterator(self, shas)
58
def _update_sha_map(self, stop_revision=None):
59
if stop_revision is None:
60
all_revids = self.repository.all_revision_ids()
62
all_revids = self.repository.get_ancestry(stop_revision)
63
first = all_revids.pop(0) # Pop leading None
48
65
graph = self.repository.get_graph()
49
66
present_revids = set(self._idmap.revids())
67
missing_revids = [revid for revid in graph.iter_topo_order(all_revids) if revid not in present_revids]
50
68
pb = ui.ui_factory.nested_progress_bar()
52
for i, revid in enumerate(graph.iter_topo_order(all_revids)):
53
if revid in present_revids:
55
pb.update("updating git map", i, len(all_revids))
70
for i, revid in enumerate(missing_revids):
71
pb.update("updating git map", i, len(missing_revids))
56
72
self._update_sha_map_revision(revid)
78
self._update_sha_map()
79
return iter(self._idmap.sha1s())
60
81
def _update_sha_map_revision(self, revid):
61
82
inv = self.repository.get_inventory(revid)
62
objects = inventory_to_tree_and_blobs(self.repository, self.mapping, revid)
63
for sha, o, path in objects:
66
ie = inv[inv.path2id(path)]
67
if ie.kind in ("file", "symlink"):
68
self._idmap.add_entry(sha, "blob", (ie.file_id, ie.revision))
70
self._idmap.add_entry(sha, "tree", (ie.file_id, ie.revision))
83
tree_sha = self._get_ie_sha1(inv.root, inv)
71
84
rev = self.repository.get_revision(revid)
72
commit_obj = revision_to_commit(rev, tree_sha, self._idmap._parent_lookup)
73
self._idmap.add_entry(commit_obj.sha().hexdigest(), "commit", (revid, tree_sha))
75
def _get_blob(self, fileid, revision):
76
text = self.repository.texts.get_record_stream([(fileid, revision)], "unordered", True).next().get_bytes_as("fulltext")
85
commit_obj = revision_to_commit(rev, tree_sha,
86
self._idmap._parent_lookup)
88
foreign_revid, mapping = mapping_registry.parse_revision_id(revid)
89
except errors.InvalidRevisionId:
92
if foreign_revid != commit_obj.id:
93
if not "fix-shamap" in debug.debug_flags:
94
raise AssertionError("recreated git commit had different sha1: expected %s, got %s" % (foreign_revid, commit_obj.id))
95
self._idmap.add_entry(commit_obj.id, "commit", (revid, tree_sha))
97
def _check_expected_sha(self, expected_sha, object):
98
if expected_sha is None:
100
if expected_sha != object.id:
101
raise AssertionError("Invalid sha for %r: %s" % (object, expected_sha))
103
def _get_ie_object(self, entry, inv):
104
if entry.kind == "directory":
105
return self._get_tree(entry.file_id, inv.revision_id, inv=inv)
107
return self._get_blob(entry.file_id, entry.revision)
109
def _get_ie_object_or_sha1(self, entry, inv):
110
if entry.kind == "directory":
112
return self._idmap.lookup_tree(entry.file_id, inv.revision_id), None
114
ret = self._get_ie_object(entry, inv)
115
self._idmap.add_entry(ret.id, "tree", (entry.file_id, inv.revision_id))
119
return self._idmap.lookup_blob(entry.file_id, entry.revision), None
121
ret = self._get_ie_object(entry, inv)
122
self._idmap.add_entry(ret.id, "blob", (entry.file_id, entry.revision))
125
def _get_ie_sha1(self, entry, inv):
126
return self._get_ie_object_or_sha1(entry, inv)[0]
128
def _get_blob(self, fileid, revision, expected_sha=None):
129
"""Return a Git Blob object from a fileid and revision stored in bzr.
131
:param fileid: File id of the text
132
:param revision: Revision of the text
134
text = self.repository.texts.get_record_stream([(fileid, revision)],
135
"unordered", True).next().get_bytes_as("fulltext")
138
self._check_expected_sha(expected_sha, blob)
81
def _get_tree(self, fileid, revid):
82
raise NotImplementedError(self._get_tree)
84
def _get_commit(self, revid, tree_sha):
141
def _get_tree(self, fileid, revid, inv=None, expected_sha=None):
142
"""Return a Git Tree object from a file id and a revision stored in bzr.
144
:param fileid: fileid in the tree.
145
:param revision: Revision of the tree.
148
inv = self.repository.get_inventory(revid)
149
tree = directory_to_tree(inv[fileid], lambda ie: self._get_ie_sha1(ie, inv))
150
self._check_expected_sha(expected_sha, tree)
153
def _get_commit(self, revid, tree_sha, expected_sha=None):
85
154
rev = self.repository.get_revision(revid)
86
return revision_to_commit(rev, tree_sha, self._idmap._parent_lookup)
88
def __getitem__(self, sha):
89
# See if sha is in map
91
(type, type_data) = self._idmap.lookup_git_sha(sha)
155
commit = revision_to_commit(rev, tree_sha, self._lookup_revision_sha1)
156
self._check_expected_sha(expected_sha, commit)
159
def get_parents(self, sha):
160
return self[sha].parents
162
def _lookup_revision_sha1(self, revid):
164
return self._idmap._parent_lookup(revid)
166
inv = self.repository.get_inventory(revid)
167
tree_sha = self._get_ie_sha1(inv.root, inv)
168
ret = self._get_commit(revid, tree_sha).id
169
self._idmap.add_entry(ret, "commit", (revid, tree_sha))
172
def get_raw(self, sha):
173
return self[sha].as_raw_string()
175
def __contains__(self, sha):
176
# See if sha is in map
178
self._lookup_git_sha(sha)
184
def _lookup_git_sha(self, sha):
185
# See if sha is in map
187
return self._idmap.lookup_git_sha(sha)
93
189
# if not, see if there are any unconverted revisions and add them
94
190
# to the map, search for sha in map again
95
191
self._update_sha_map()
96
(type, type_data) = self._idmap.lookup_git_sha(sha)
192
return self._idmap.lookup_git_sha(sha)
194
def __getitem__(self, sha):
195
(type, type_data) = self._lookup_git_sha(sha)
97
196
# convert object to git object
98
197
if type == "commit":
99
return self._get_commit(*type_data)
198
return self._get_commit(type_data[0], type_data[1],
100
200
elif type == "blob":
101
return self._get_blob(*type_data)
201
return self._get_blob(type_data[0], type_data[1], expected_sha=sha)
102
202
elif type == "tree":
103
return self._get_tree(*type_data)
203
return self._get_tree(type_data[0], type_data[1], expected_sha=sha)
105
205
raise AssertionError("Unknown object type '%s'" % type)