/brz/remove-bazaar

To get this branch, use:
bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar
0.200.910 by Jelmer Vernooij
update copyright years
1
# Copyright (C) 2008-2010 Jelmer Vernooij <jelmer@samba.org>
0.200.135 by Jelmer Vernooij
Add stub for fetching data.
2
#
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
#
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
#
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
0.200.261 by Jelmer Vernooij
More formatting fixes.
17
from dulwich.objects import (
18
    Commit,
0.200.303 by Jelmer Vernooij
Cope with tags during fetch.
19
    Tag,
0.200.814 by Jelmer Vernooij
Avoid the use of InventoryDirectory.children. This speeds up
20
    Tree,
0.200.540 by Jelmer Vernooij
Handle submodules explicitly.
21
    S_ISGITLINK,
0.200.1176 by Jelmer Vernooij
Fix fetch return value for inter git fetching.
22
    ZERO_SHA,
0.200.261 by Jelmer Vernooij
More formatting fixes.
23
    )
0.200.883 by Jelmer Vernooij
Add function for verifying reconstruction of objects still works.
24
from dulwich.object_store import (
25
    tree_lookup_path,
26
    )
0.200.830 by Jelmer Vernooij
Bump minimum dulwich version.
27
from itertools import (
28
    imap,
29
    )
0.200.819 by Jelmer Vernooij
Avoid decoding basename twice.
30
import posixpath
0.200.563 by Jelmer Vernooij
Attempt to parse progress indication from git status reports.
31
import re
0.200.352 by Jelmer Vernooij
Simplify mode handling.
32
import stat
0.200.252 by Jelmer Vernooij
Clarify history, copyright.
33
34
from bzrlib import (
0.231.2 by Jelmer Vernooij
Add -Dverify flag (not fully implemented yet).
35
    debug,
0.200.252 by Jelmer Vernooij
Clarify history, copyright.
36
    osutils,
0.200.261 by Jelmer Vernooij
More formatting fixes.
37
    trace,
0.200.252 by Jelmer Vernooij
Clarify history, copyright.
38
    ui,
39
    )
40
from bzrlib.errors import (
0.239.5 by Jelmer Vernooij
Print user-understandable error message when encountering submodules.
41
    BzrError,
0.200.372 by Jelmer Vernooij
Fix key when looking up old sha's in cache.
42
    NoSuchId,
0.200.252 by Jelmer Vernooij
Clarify history, copyright.
43
    )
0.200.261 by Jelmer Vernooij
More formatting fixes.
44
from bzrlib.inventory import (
45
    Inventory,
0.229.2 by Jelmer Vernooij
Initial work relying on inventory deltas.
46
    InventoryDirectory,
47
    InventoryFile,
0.229.3 by Jelmer Vernooij
Use inventory deltas internally so fetch is O(changes) rather than O(tree).
48
    InventoryLink,
0.200.664 by Jelmer Vernooij
Support submodules during fetch.
49
    TreeReference,
0.200.261 by Jelmer Vernooij
More formatting fixes.
50
    )
51
from bzrlib.repository import (
52
    InterRepository,
53
    )
0.229.3 by Jelmer Vernooij
Use inventory deltas internally so fetch is O(changes) rather than O(tree).
54
from bzrlib.revision import (
55
    NULL_REVISION,
56
    )
0.200.1187 by Jelmer Vernooij
Use InventoryRevisionTree.
57
try:
58
    from bzrlib.revisiontree import InventoryRevisionTree
59
except ImportError: # bzr < 2.4
60
    from bzrlib.revisiontree import RevisionTree as InventoryRevisionTree
0.200.1023 by Jelmer Vernooij
Set and verify testament.
61
from bzrlib.testament import (
62
    StrictTestament3,
63
    )
0.200.292 by Jelmer Vernooij
Fix formatting.
64
from bzrlib.tsort import (
65
    topo_sort,
66
    )
0.200.417 by Jelmer Vernooij
use insert_record_stream rather than add_lines.
67
from bzrlib.versionedfile import (
0.200.811 by Jelmer Vernooij
Use ChunkedContentFactory when possible.
68
    ChunkedContentFactory,
0.200.417 by Jelmer Vernooij
use insert_record_stream rather than add_lines.
69
    )
0.200.135 by Jelmer Vernooij
Add stub for fetching data.
70
0.231.2 by Jelmer Vernooij
Add -Dverify flag (not fully implemented yet).
71
from bzrlib.plugins.git.mapping import (
0.200.345 by Jelmer Vernooij
Keep track of file modes to use.
72
    DEFAULT_FILE_MODE,
0.200.521 by Jelmer Vernooij
Abstract out kind mapping a bit, initial work on support tree-references.
73
    mode_is_executable,
0.200.820 by Jelmer Vernooij
Avoid relying on InventoryDirectory.children.
74
    mode_kind,
0.200.490 by Jelmer Vernooij
Warn about unusual modes and escaped XML-invalid characters.
75
    warn_unusual_mode,
0.231.2 by Jelmer Vernooij
Add -Dverify flag (not fully implemented yet).
76
    )
0.200.456 by Jelmer Vernooij
Fix git -> git fetching.
77
from bzrlib.plugins.git.object_store import (
78
    BazaarObjectStore,
0.200.852 by Jelmer Vernooij
Cache trees rather than inventories.
79
    LRUTreeCache,
0.200.883 by Jelmer Vernooij
Add function for verifying reconstruction of objects still works.
80
    _tree_to_objects,
0.200.456 by Jelmer Vernooij
Fix git -> git fetching.
81
    )
0.259.4 by Jelmer Vernooij
Put determine_wants methods on InterRepo.
82
from bzrlib.plugins.git.refs import extract_tags
0.200.426 by Jelmer Vernooij
Fix import of RemoteGitRepository.
83
from bzrlib.plugins.git.remote import (
84
    RemoteGitRepository,
85
    )
0.200.169 by Jelmer Vernooij
Fix branch cloning.
86
from bzrlib.plugins.git.repository import (
0.200.664 by Jelmer Vernooij
Support submodules during fetch.
87
    GitRepository,
0.200.289 by Jelmer Vernooij
Cope with new member variables in RepositoryFormat.
88
    GitRepositoryFormat,
0.200.426 by Jelmer Vernooij
Fix import of RemoteGitRepository.
89
    LocalGitRepository,
0.200.261 by Jelmer Vernooij
More formatting fixes.
90
    )
0.216.4 by Jelmer Vernooij
Add basic pack fetch infrastructure.
91
92
0.200.821 by Jelmer Vernooij
Remove last references to ID.children.
93
def import_git_blob(texts, mapping, path, name, (base_hexsha, hexsha), 
0.200.848 by Jelmer Vernooij
remove unnecessary parent_inv_shamap.
94
        base_inv, parent_id, revision_id,
0.200.896 by Jelmer Vernooij
Add separate function for looking up file ids.
95
        parent_invs, lookup_object, (base_mode, mode), store_updater,
96
        lookup_file_id):
0.200.151 by Jelmer Vernooij
Support converting git objects to bzr objects.
97
    """Import a git blob object into a bzr repository.
98
0.200.261 by Jelmer Vernooij
More formatting fixes.
99
    :param texts: VersionedFiles to add to
0.200.151 by Jelmer Vernooij
Support converting git objects to bzr objects.
100
    :param path: Path in the tree
101
    :param blob: A git blob
0.229.1 by Jelmer Vernooij
Start working with inventory deltas.
102
    :return: Inventory delta for this file
0.200.151 by Jelmer Vernooij
Support converting git objects to bzr objects.
103
    """
0.252.28 by Jelmer Vernooij
Don't import control files.
104
    if mapping.is_control_file(path):
105
        return []
0.200.816 by Jelmer Vernooij
Leave mode handling for blobs to import_git_blob.
106
    if base_hexsha == hexsha and base_mode == mode:
107
        # If nothing has changed since the base revision, we're done
0.200.839 by Jelmer Vernooij
Add convenience object for updating the object store caching layer.
108
        return []
0.200.896 by Jelmer Vernooij
Add separate function for looking up file ids.
109
    file_id = lookup_file_id(path)
0.200.816 by Jelmer Vernooij
Leave mode handling for blobs to import_git_blob.
110
    if stat.S_ISLNK(mode):
0.200.320 by Jelmer Vernooij
Handle lightweight checkouts.
111
        cls = InventoryLink
112
    else:
113
        cls = InventoryFile
0.200.821 by Jelmer Vernooij
Remove last references to ID.children.
114
    ie = cls(file_id, name.decode("utf-8"), parent_id)
0.200.995 by Jelmer Vernooij
Support newer versions of bzr where only some InventoryFile/InventoryLink attributes are writable.
115
    if ie.kind == "file":
116
        ie.executable = mode_is_executable(mode)
0.200.821 by Jelmer Vernooij
Remove last references to ID.children.
117
    if base_hexsha == hexsha and mode_kind(base_mode) == mode_kind(mode):
118
        base_ie = base_inv[base_inv.path2id(path)]
0.200.373 by Jelmer Vernooij
Re-use inventory entries rather than looking them up again and again.
119
        ie.text_size = base_ie.text_size
120
        ie.text_sha1 = base_ie.text_sha1
0.200.995 by Jelmer Vernooij
Support newer versions of bzr where only some InventoryFile/InventoryLink attributes are writable.
121
        if ie.kind == "symlink":
122
            ie.symlink_target = base_ie.symlink_target
0.200.537 by Jelmer Vernooij
Fix handling of not-executable files becoming executable without any other changes.
123
        if ie.executable == base_ie.executable:
124
            ie.revision = base_ie.revision
125
        else:
126
            blob = lookup_object(hexsha)
0.200.304 by Jelmer Vernooij
Try a bit harder to avoid fetching objects we don't need.
127
    else:
128
        blob = lookup_object(hexsha)
0.200.320 by Jelmer Vernooij
Handle lightweight checkouts.
129
        if ie.kind == "symlink":
0.200.551 by Jelmer Vernooij
Properly set InventoryEntry revision when changing symlink targets.
130
            ie.revision = None
0.200.320 by Jelmer Vernooij
Handle lightweight checkouts.
131
            ie.symlink_target = blob.data
132
        else:
0.200.830 by Jelmer Vernooij
Bump minimum dulwich version.
133
            ie.text_size = sum(imap(len, blob.chunked))
134
            ie.text_sha1 = osutils.sha_strings(blob.chunked)
0.229.3 by Jelmer Vernooij
Use inventory deltas internally so fetch is O(changes) rather than O(tree).
135
    # Check what revision we should store
0.200.283 by Jelmer Vernooij
Avoid storing repeated texts for blobs.
136
    parent_keys = []
0.200.904 by Jelmer Vernooij
Fix inconsistent parents.
137
    for pinv in parent_invs:
0.200.829 by Jelmer Vernooij
Cope with the fact that _type is gone in upstream dulwich.
138
        try:
139
            pie = pinv[file_id]
140
        except NoSuchId:
141
            continue
0.252.25 by Jelmer Vernooij
Reformatting.
142
        if (pie.text_sha1 == ie.text_sha1 and
143
            pie.executable == ie.executable and
144
            pie.symlink_target == ie.symlink_target):
0.229.3 by Jelmer Vernooij
Use inventory deltas internally so fetch is O(changes) rather than O(tree).
145
            # found a revision in one of the parents to use
0.200.373 by Jelmer Vernooij
Re-use inventory entries rather than looking them up again and again.
146
            ie.revision = pie.revision
0.229.3 by Jelmer Vernooij
Use inventory deltas internally so fetch is O(changes) rather than O(tree).
147
            break
0.200.904 by Jelmer Vernooij
Fix inconsistent parents.
148
        parent_key = (file_id, pie.revision)
149
        if not parent_key in parent_keys:
150
            parent_keys.append(parent_key)
0.229.3 by Jelmer Vernooij
Use inventory deltas internally so fetch is O(changes) rather than O(tree).
151
    if ie.revision is None:
152
        # Need to store a new revision
153
        ie.revision = revision_id
154
        assert ie.revision is not None
0.200.698 by Jelmer Vernooij
Merge fixes for SHA1s of symlinks.
155
        if ie.kind == 'symlink':
0.200.811 by Jelmer Vernooij
Use ChunkedContentFactory when possible.
156
            chunks = []
0.200.1292 by Jelmer Vernooij
Fix repeeling objects when determining what to send.
157
        else:
0.200.830 by Jelmer Vernooij
Bump minimum dulwich version.
158
            chunks = blob.chunked
0.252.25 by Jelmer Vernooij
Reformatting.
159
        texts.insert_record_stream([
160
            ChunkedContentFactory((file_id, ie.revision),
161
                tuple(parent_keys), ie.text_sha1, chunks)])
0.200.572 by Jelmer Vernooij
Avoid some extra path lookups.
162
    invdelta = []
0.200.820 by Jelmer Vernooij
Avoid relying on InventoryDirectory.children.
163
    if base_hexsha is not None:
0.200.984 by Jelmer Vernooij
Handle non-ascii characters in filenames.
164
        old_path = path.decode("utf-8") # Renames are not supported yet
0.200.820 by Jelmer Vernooij
Avoid relying on InventoryDirectory.children.
165
        if stat.S_ISDIR(base_mode):
0.200.826 by Jelmer Vernooij
Fix some long lines.
166
            invdelta.extend(remove_disappeared_children(base_inv, old_path,
167
                lookup_object(base_hexsha), [], lookup_object))
0.229.3 by Jelmer Vernooij
Use inventory deltas internally so fetch is O(changes) rather than O(tree).
168
    else:
169
        old_path = None
0.200.984 by Jelmer Vernooij
Handle non-ascii characters in filenames.
170
    new_path = path.decode("utf-8")
171
    invdelta.append((old_path, new_path, file_id, ie))
0.200.839 by Jelmer Vernooij
Add convenience object for updating the object store caching layer.
172
    if base_hexsha != hexsha:
0.200.952 by Jelmer Vernooij
Write git pack files rather than loose objects.
173
        store_updater.add_object(blob, ie, path)
0.200.839 by Jelmer Vernooij
Add convenience object for updating the object store caching layer.
174
    return invdelta
0.200.261 by Jelmer Vernooij
More formatting fixes.
175
176
0.200.664 by Jelmer Vernooij
Support submodules during fetch.
177
class SubmodulesRequireSubtrees(BzrError):
    """Raised when a git tree contains a submodule but submodules are not
    allowed for the repository being fetched into."""

    _fmt = ("The repository you are fetching from contains submodules. "
            "To continue, upgrade your Bazaar repository to a format that "
            "supports nested trees, such as 'development-subtree'.")
    # NOTE(review): BzrError appears to consult ``internal_error`` (not
    # ``internal``) when deciding whether to show a traceback - confirm
    # against bzrlib.errors. Both names are set so the intent (a plain
    # user-facing message) holds either way and existing readers of
    # ``internal`` keep working.
    internal_error = False
    internal = False
180
181
0.200.821 by Jelmer Vernooij
Remove last references to ID.children.
182
def import_git_submodule(texts, mapping, path, name, (base_hexsha, hexsha),
0.200.817 by Jelmer Vernooij
Deal with all modes locally.
183
    base_inv, parent_id, revision_id, parent_invs, lookup_object,
0.200.896 by Jelmer Vernooij
Add separate function for looking up file ids.
184
    (base_mode, mode), store_updater, lookup_file_id):
0.200.817 by Jelmer Vernooij
Deal with all modes locally.
185
    if base_hexsha == hexsha and base_mode == mode:
0.200.839 by Jelmer Vernooij
Add convenience object for updating the object store caching layer.
186
        return [], {}
0.200.896 by Jelmer Vernooij
Add separate function for looking up file ids.
187
    file_id = lookup_file_id(path)
0.200.821 by Jelmer Vernooij
Remove last references to ID.children.
188
    ie = TreeReference(file_id, name.decode("utf-8"), parent_id)
0.200.664 by Jelmer Vernooij
Support submodules during fetch.
189
    ie.revision = revision_id
0.200.817 by Jelmer Vernooij
Deal with all modes locally.
190
    if base_hexsha is None:
0.200.664 by Jelmer Vernooij
Support submodules during fetch.
191
        oldpath = None
192
    else:
193
        oldpath = path
194
    ie.reference_revision = mapping.revision_id_foreign_to_bzr(hexsha)
0.252.25 by Jelmer Vernooij
Reformatting.
195
    texts.insert_record_stream([
196
        ChunkedContentFactory((file_id, ie.revision), (), None, [])])
0.200.664 by Jelmer Vernooij
Support submodules during fetch.
197
    invdelta = [(oldpath, path, file_id, ie)]
0.200.839 by Jelmer Vernooij
Add convenience object for updating the object store caching layer.
198
    return invdelta, {}
0.200.540 by Jelmer Vernooij
Handle submodules explicitly.
199
200
0.200.820 by Jelmer Vernooij
Avoid relying on InventoryDirectory.children.
201
def remove_disappeared_children(base_inv, path, base_tree, existing_children,
        lookup_object):
    """Generate an inventory delta for removed children.

    Every entry of base_tree whose name is not in existing_children is
    reported as removed; removed directories are descended into so that
    all of their contents are reported as well.

    :param base_inv: Base inventory against which to generate the
        inventory delta.
    :param path: Path to process (unicode)
    :param base_tree: Git Tree base object
    :param existing_children: Names (as found in the git tree) of the
        children that still exist
    :param lookup_object: Lookup a git object by its SHA1
    :return: Inventory delta, as list
    """
    assert isinstance(path, unicode), "path must be unicode: %r" % (path,)
    ret = []
    for name, mode, hexsha in base_tree.iteritems():
        if name in existing_children:
            continue
        c_path = posixpath.join(path, name.decode("utf-8"))
        file_id = base_inv.path2id(c_path)
        # Everything in the base git tree is expected to be present in the
        # base inventory; name the path so a failure can be diagnosed.
        assert file_id is not None, (
            "no file id in base inventory for %r" % (c_path,))
        ret.append((c_path, None, file_id, None))
        if stat.S_ISDIR(mode):
            # Nothing below a removed directory survives
            ret.extend(remove_disappeared_children(
                base_inv, c_path, lookup_object(hexsha), [], lookup_object))
    return ret
226
227
0.200.821 by Jelmer Vernooij
Remove last references to ID.children.
228
def import_git_tree(texts, mapping, path, name, (base_hexsha, hexsha),
0.200.848 by Jelmer Vernooij
remove unnecessary parent_inv_shamap.
229
        base_inv, parent_id, revision_id, parent_invs,
0.200.896 by Jelmer Vernooij
Add separate function for looking up file ids.
230
        lookup_object, (base_mode, mode), store_updater,
231
        lookup_file_id, allow_submodules=False):
0.200.151 by Jelmer Vernooij
Support converting git objects to bzr objects.
232
    """Import a git tree object into a bzr repository.
233
0.200.261 by Jelmer Vernooij
More formatting fixes.
234
    :param texts: VersionedFiles object to add to
0.200.984 by Jelmer Vernooij
Handle non-ascii characters in filenames.
235
    :param path: Path in the tree (str)
236
    :param name: Name of the tree (str)
0.200.151 by Jelmer Vernooij
Support converting git objects to bzr objects.
237
    :param tree: A git tree object
0.229.2 by Jelmer Vernooij
Initial work relying on inventory deltas.
238
    :param base_inv: Base inventory against which to return inventory delta
0.229.1 by Jelmer Vernooij
Start working with inventory deltas.
239
    :return: Inventory delta for this subtree
0.200.151 by Jelmer Vernooij
Support converting git objects to bzr objects.
240
    """
0.200.984 by Jelmer Vernooij
Handle non-ascii characters in filenames.
241
    assert type(path) is str
242
    assert type(name) is str
0.200.817 by Jelmer Vernooij
Deal with all modes locally.
243
    if base_hexsha == hexsha and base_mode == mode:
244
        # If nothing has changed since the base revision, we're done
0.200.839 by Jelmer Vernooij
Add convenience object for updating the object store caching layer.
245
        return [], {}
0.200.344 by Jelmer Vernooij
Clarify names, use convenience function
246
    invdelta = []
0.200.896 by Jelmer Vernooij
Add separate function for looking up file ids.
247
    file_id = lookup_file_id(path)
0.200.297 by Jelmer Vernooij
Cope with non-ascii characters in filenames (needs a test..).
248
    # We just have to hope this is indeed utf-8:
0.200.821 by Jelmer Vernooij
Remove last references to ID.children.
249
    ie = InventoryDirectory(file_id, name.decode("utf-8"), parent_id)
0.200.817 by Jelmer Vernooij
Deal with all modes locally.
250
    tree = lookup_object(hexsha)
251
    if base_hexsha is None:
252
        base_tree = None
0.200.823 by Jelmer Vernooij
Simplify logic in import_git_tree a bit.
253
        old_path = None # Newly appeared here
0.200.817 by Jelmer Vernooij
Deal with all modes locally.
254
    else:
255
        base_tree = lookup_object(base_hexsha)
0.200.984 by Jelmer Vernooij
Handle non-ascii characters in filenames.
256
        old_path = path.decode("utf-8") # Renames aren't supported yet
257
    new_path = path.decode("utf-8")
0.200.823 by Jelmer Vernooij
Simplify logic in import_git_tree a bit.
258
    if base_tree is None or type(base_tree) is not Tree:
259
        ie.revision = revision_id
0.200.984 by Jelmer Vernooij
Handle non-ascii characters in filenames.
260
        invdelta.append((old_path, new_path, ie.file_id, ie))
0.252.24 by Jelmer Vernooij
Support reading fileid map.
261
        texts.insert_record_stream([
262
            ChunkedContentFactory((ie.file_id, ie.revision), (), None, [])])
0.229.3 by Jelmer Vernooij
Use inventory deltas internally so fetch is O(changes) rather than O(tree).
263
    # Remember for next time
0.200.300 by Jelmer Vernooij
Fix recursive deletion of dirs.
264
    existing_children = set()
0.200.345 by Jelmer Vernooij
Keep track of file modes to use.
265
    child_modes = {}
0.200.1147 by Jelmer Vernooij
Use Tree.items() rather than Tree.entries().
266
    for name, child_mode, child_hexsha in tree.iteritems():
0.200.820 by Jelmer Vernooij
Avoid relying on InventoryDirectory.children.
267
        existing_children.add(name)
0.200.819 by Jelmer Vernooij
Avoid decoding basename twice.
268
        child_path = posixpath.join(path, name)
0.200.814 by Jelmer Vernooij
Avoid the use of InventoryDirectory.children. This speeds up
269
        if type(base_tree) is Tree:
270
            try:
271
                child_base_mode, child_base_hexsha = base_tree[name]
272
            except KeyError:
273
                child_base_hexsha = None
274
                child_base_mode = 0
275
        else:
276
            child_base_hexsha = None
277
            child_base_mode = 0
0.200.816 by Jelmer Vernooij
Leave mode handling for blobs to import_git_blob.
278
        if stat.S_ISDIR(child_mode):
0.252.25 by Jelmer Vernooij
Reformatting.
279
            subinvdelta, grandchildmodes = import_git_tree(texts, mapping,
280
                child_path, name, (child_base_hexsha, child_hexsha), base_inv,
0.200.1059 by Jelmer Vernooij
Fix graph tests.
281
                file_id, revision_id, parent_invs, lookup_object,
0.252.25 by Jelmer Vernooij
Reformatting.
282
                (child_base_mode, child_mode), store_updater, lookup_file_id,
283
                allow_submodules=allow_submodules)
0.200.816 by Jelmer Vernooij
Leave mode handling for blobs to import_git_blob.
284
        elif S_ISGITLINK(child_mode): # submodule
0.200.666 by Jelmer Vernooij
Refuse to add tree references to non-subtree formats.
285
            if not allow_submodules:
286
                raise SubmodulesRequireSubtrees()
0.252.25 by Jelmer Vernooij
Reformatting.
287
            subinvdelta, grandchildmodes = import_git_submodule(texts, mapping,
288
                child_path, name, (child_base_hexsha, child_hexsha), base_inv,
289
                file_id, revision_id, parent_invs, lookup_object,
290
                (child_base_mode, child_mode), store_updater, lookup_file_id)
0.200.352 by Jelmer Vernooij
Simplify mode handling.
291
        else:
0.252.25 by Jelmer Vernooij
Reformatting.
292
            subinvdelta = import_git_blob(texts, mapping, child_path, name,
293
                (child_base_hexsha, child_hexsha), base_inv, file_id,
294
                revision_id, parent_invs, lookup_object,
295
                (child_base_mode, child_mode), store_updater, lookup_file_id)
0.200.757 by Jelmer Vernooij
Use inventory deltas.
296
            grandchildmodes = {}
297
        child_modes.update(grandchildmodes)
298
        invdelta.extend(subinvdelta)
0.200.816 by Jelmer Vernooij
Leave mode handling for blobs to import_git_blob.
299
        if child_mode not in (stat.S_IFDIR, DEFAULT_FILE_MODE,
0.200.359 by Jelmer Vernooij
Simplify file mode handling, avoid inventory_to_tree_and_blobs as it is expensive if trees/blobs have already been converted.
300
                        stat.S_IFLNK, DEFAULT_FILE_MODE|0111):
0.200.879 by Jelmer Vernooij
Fix unusual modes.
301
            child_modes[child_path] = child_mode
0.229.3 by Jelmer Vernooij
Use inventory deltas internally so fetch is O(changes) rather than O(tree).
302
    # Remove any children that have disappeared
0.200.817 by Jelmer Vernooij
Deal with all modes locally.
303
    if base_tree is not None and type(base_tree) is Tree:
0.200.984 by Jelmer Vernooij
Handle non-ascii characters in filenames.
304
        invdelta.extend(remove_disappeared_children(base_inv, old_path,
0.200.820 by Jelmer Vernooij
Avoid relying on InventoryDirectory.children.
305
            base_tree, existing_children, lookup_object))
0.200.952 by Jelmer Vernooij
Write git pack files rather than loose objects.
306
    store_updater.add_object(tree, ie, path)
0.200.839 by Jelmer Vernooij
Add convenience object for updating the object store caching layer.
307
    return invdelta, child_modes
0.200.151 by Jelmer Vernooij
Support converting git objects to bzr objects.
308
309
0.200.883 by Jelmer Vernooij
Add function for verifying reconstruction of objects still works.
310
def verify_commit_reconstruction(target_git_object_retriever, lookup_object,
    o, rev, ret_tree, parent_trees, mapping, unusual_modes, verifiers):
    """Check that an imported commit converts back to identical git objects.

    :param target_git_object_retriever: Object store used to reconstruct
        the commit and to supply the id map
    :param lookup_object: Lookup a git object by its SHA1
    :param o: The original git commit
    :param rev: The imported revision
    :param ret_tree: Revision tree of the imported revision
    :param parent_trees: Revision trees of the parents
    :param mapping: Mapping to use
    :param unusual_modes: Unusual file modes found during the import
    :param verifiers: Verifiers passed on when reconstructing the commit
    :raise AssertionError: if the unusual modes, the commit or any of the
        regenerated objects differ from the originals
    """
    exported_modes = mapping.export_unusual_file_modes(rev)
    if exported_modes != unusual_modes:
        raise AssertionError("unusual modes don't match: %r != %r" % (
            unusual_modes, exported_modes))
    # Verify that we can reconstruct the commit properly
    rec_o = target_git_object_retriever._reconstruct_commit(
        rev, o.tree, True, verifiers)
    if rec_o != o:
        raise AssertionError("Reconstructed commit differs: %r != %r" % (
            rec_o, o))
    new_objs = {}
    mismatches = []
    regenerated = _tree_to_objects(ret_tree, parent_trees,
        target_git_object_retriever._cache.idmap, unusual_modes,
        mapping.BZR_DUMMY_FILE)
    for path, obj, ie in regenerated:
        expected_id = tree_lookup_path(lookup_object, o.tree, path)[1]
        new_objs[path] = obj
        if obj.id != expected_id:
            mismatches.append((path, lookup_object(expected_id), obj))
    if not mismatches:
        return
    # Only the first mismatch is reported; narrow it down to the deepest
    # differing object before raising.
    path, old_obj, new_obj = mismatches[0]
    while (old_obj.type_name == "tree" and
           new_obj.type_name == "tree" and
           sorted(old_obj) == sorted(new_obj)):
        for name in old_obj:
            old_entry = old_obj[name]
            new_entry = new_obj[name]
            if old_entry[0] != new_entry[0]:
                raise AssertionError("Modes for %s differ: %o != %o" %
                    (path, old_entry[0], new_entry[0]))
            if old_entry[1] != new_entry[1]:
                # Found a differing child, delve deeper
                path = posixpath.join(path, name)
                old_obj = lookup_object(old_entry[1])
                new_obj = new_objs[path]
                break
    raise AssertionError("objects differ for %s: %r != %r" % (path,
        old_obj, new_obj))
346
347
0.200.679 by Jelmer Vernooij
Moving commit import functionality to a separate function.
348
def import_git_commit(repo, mapping, head, lookup_object,
                      target_git_object_retriever, trees_cache):
    """Import a git commit, and the tree it refers to, into a bzr repository.

    :param repo: Target Bazaar repository
    :param mapping: Mapping to use
    :param head: SHA1 of the git commit to import
    :param lookup_object: Lookup a git object by its SHA1
    :param target_git_object_retriever: Object store of the target
        repository; supplies the updater for its caching layer
    :param trees_cache: Cache used to obtain the parent revision trees; the
        newly imported tree is added to it
    """
    o = lookup_object(head)
    # Note that this uses mapping.revision_id_foreign_to_bzr. If the parents
    # were bzr roundtripped revisions they would be specified in the
    # roundtrip data.
    rev, roundtrip_revid, verifiers = mapping.import_commit(
        o, mapping.revision_id_foreign_to_bzr)
    # We have to do this here, since we have to walk the tree and
    # we need to make sure to import the blobs / trees with the right
    # path; this may involve adding them more than once.
    parent_trees = trees_cache.revision_trees(rev.parent_ids)
    if not parent_trees:
        base_inv = Inventory(root_id=None)
        base_tree = None
        base_mode = None
    else:
        # The delta is generated against the first parent
        base_inv = parent_trees[0].inventory
        base_tree = lookup_object(o.parents[0]).tree
        base_mode = stat.S_IFDIR
    store_updater = target_git_object_retriever._get_updater(rev)
    fileid_map = mapping.get_fileid_map(lookup_object, o.tree)
    inv_delta, unusual_modes = import_git_tree(repo.texts,
            mapping, "", "", (base_tree, o.tree), base_inv,
            None, rev.revision_id, [p.inventory for p in parent_trees],
            lookup_object, (base_mode, stat.S_IFDIR), store_updater,
            fileid_map.lookup_file_id,
            allow_submodules=getattr(repo._format, "supports_tree_reference", False))
    if unusual_modes:
        for path, mode in unusual_modes.iteritems():
            warn_unusual_mode(rev.foreign_revid, path, mode)
        mapping.import_unusual_file_modes(rev, unusual_modes)
    try:
        basis_id = rev.parent_ids[0]
    except IndexError:
        basis_id = NULL_REVISION
        base_inv = None
    rev.inventory_sha1, inv = repo.add_inventory_by_delta(basis_id,
              inv_delta, rev.revision_id, rev.parent_ids, base_inv)
    ret_tree = InventoryRevisionTree(repo, inv, rev.revision_id)
    if roundtrip_revid is not None:
        original_revid = rev.revision_id
        rev.revision_id = roundtrip_revid
        # Check verifiers
        if getattr(StrictTestament3, "from_revision_tree", None):
            testament = StrictTestament3(rev, ret_tree)
        else: # bzr < 2.4
            testament = StrictTestament3(rev, inv)
        calculated_verifiers = { "testament3-sha1": testament.as_sha1() }
        if calculated_verifiers != verifiers:
            # The roundtrip data may lack a testament altogether; use .get()
            # so that logging the mismatch cannot itself abort the import.
            trace.mutter("Testament SHA1 %r for %r did not match %r.",
                         calculated_verifiers["testament3-sha1"],
                         rev.revision_id, verifiers.get("testament3-sha1"))
            # Fall back to the natively mapped revision id
            rev.revision_id = original_revid
    else:
        calculated_verifiers = {}
    store_updater.add_object(o, calculated_verifiers, None)
    store_updater.finish()
    trees_cache.add(ret_tree)
    repo.add_revision(rev.revision_id, rev)
    if "verify" in debug.debug_flags:
        verify_commit_reconstruction(target_git_object_retriever,
            lookup_object, o, rev, ret_tree, parent_trees, mapping,
            unusual_modes, verifiers)
0.200.679 by Jelmer Vernooij
Moving commit import functionality to a separate function.
412
413
0.248.5 by Jelmer Vernooij
Reformatting, fix dpush.
414
def import_git_objects(repo, mapping, object_iter,
    target_git_object_retriever, heads, pb=None, limit=None):
    """Import a set of git objects into a bzr repository.

    The commit graph is walked backwards from ``heads`` to find the commits
    the repository does not have yet; those are then topologically sorted
    and imported in batches, each batch inside its own pair of write groups.

    :param repo: Target Bazaar repository
    :param mapping: Mapping to use
    :param object_iter: Git objects being fetched, looked up by sha.
    :param target_git_object_retriever: Object store consulted when a sha
        is not found in ``object_iter``; its write group is opened and
        closed around every batch.
    :param heads: Shas to start walking from.
    :param pb: Optional progress bar
    :param limit: If not None, only the first ``limit`` entries of the
        sorted list are imported.
    :return: Tuple with pack hints and the id of the last imported commit
        (None when nothing was imported)
    """
    def lookup_object(sha):
        try:
            return object_iter[sha]
        except KeyError:
            return target_git_object_retriever[sha]

    graph = []
    checked = set()
    heads = list(set(heads))
    trees_cache = LRUTreeCache(repo)
    # Find and convert commit objects
    while heads:
        if pb is not None:
            pb.update("finding revisions to fetch", len(graph), None)
        head = heads.pop()
        assert isinstance(head, str)
        if head in checked:
            # The same sha can be queued several times (shared parent of
            # two commits, or a tag pointing at a queued commit). It has
            # already been handled, so don't look it up and convert it again.
            continue
        try:
            o = lookup_object(head)
        except KeyError:
            continue
        if isinstance(o, Commit):
            rev, roundtrip_revid, verifiers = mapping.import_commit(o,
                mapping.revision_id_foreign_to_bzr)
            if (repo.has_revision(rev.revision_id) or
                (roundtrip_revid and repo.has_revision(roundtrip_revid))):
                # Already present in the target; no need to walk further.
                continue
            graph.append((o.id, o.parents))
            heads.extend([p for p in o.parents if p not in checked])
        elif isinstance(o, Tag):
            # Follow the tag to the object it points at.
            if o.object[1] not in checked:
                heads.append(o.object[1])
        else:
            trace.warning("Unable to import head object %r" % o)
        checked.add(o.id)
    del checked
    # Order the revisions
    # Create the inventory objects
    batch_size = 1000
    revision_ids = topo_sort(graph)
    pack_hints = []
    if limit is not None:
        revision_ids = revision_ids[:limit]
    last_imported = None
    for offset in range(0, len(revision_ids), batch_size):
        target_git_object_retriever.start_write_group()
        try:
            repo.start_write_group()
            try:
                for i, head in enumerate(
                    revision_ids[offset:offset+batch_size]):
                    if pb is not None:
                        pb.update("fetching revisions", offset+i,
                                  len(revision_ids))
                    import_git_commit(repo, mapping, head, lookup_object,
                        target_git_object_retriever, trees_cache)
                    last_imported = head
            except:
                repo.abort_write_group()
                raise
            else:
                hint = repo.commit_write_group()
                if hint is not None:
                    pack_hints.extend(hint)
        except:
            # Any failure in the batch, including the repository's own
            # write group handling, also rolls back the object store.
            target_git_object_retriever.abort_write_group()
            raise
        else:
            target_git_object_retriever.commit_write_group()
    return pack_hints, last_imported
0.200.141 by Jelmer Vernooij
Separate out local and remote fetching.
491
492
0.200.456 by Jelmer Vernooij
Fix git -> git fetching.
493
class InterGitRepository(InterRepository):
    """Shared behaviour for InterRepository implementations whose source
    is a Git repository."""

    _matching_repo_format = GitRepositoryFormat()

    def _target_has_shas(self, shas):
        """Return the shas already available in the target.

        Must be provided by subclasses.
        """
        raise NotImplementedError(self._target_has_shas)

    def get_determine_wants_heads(self, wants, include_tags=False):
        """Build a determine_wants callback for a fixed set of shas.

        :param wants: Shas that should be fetched
        :param include_tags: Whether to also request the shas of the tags
            found in the refs handed to the callback
        :return: Callable taking the refs and returning a list of the
            requested shas the target does not report having
        """
        requested = set(wants)

        def determine_wants(refs):
            candidates = set(requested)
            if include_tags:
                for tag_shas in extract_tags(refs).itervalues():
                    # Use the second entry when it is set, else the first.
                    candidates.add(tag_shas[1] or tag_shas[0])
            missing = candidates - self._target_has_shas(candidates)
            return list(missing)
        return determine_wants

    def determine_wants_all(self, refs):
        """Return every sha in ``refs`` that the target does not report
        having, ignoring refs whose name ends in "^{}"."""
        candidates = set()
        for ref_name, sha in refs.iteritems():
            if ref_name.endswith("^{}"):
                continue
            candidates.add(sha)
        return list(candidates - self._target_has_shas(candidates))

    @staticmethod
    def _get_repo_format_to_test():
        return None

    def copy_content(self, revision_id=None, pb=None):
        """See InterRepository.copy_content."""
        self.fetch(revision_id, pb, find_ghosts=False)
522
0.200.456 by Jelmer Vernooij
Fix git -> git fetching.
523
524
class InterGitNonGitRepository(InterGitRepository):
    """Base InterRepository that copies revisions from a Git into a non-Git
    repository."""

    def _target_has_shas(self, shas):
        """Return the subset of ``shas`` whose revision is in the target.

        The target is queried by bzr revision id, so the answer is
        translated back to git shas; callers subtract the result from a
        set of shas.
        """
        sha_by_revid = {}
        for sha in shas:
            sha_by_revid[self.source.lookup_foreign_revision_id(sha)] = sha
        present = self.target.has_revisions(sha_by_revid.keys())
        return set([sha_by_revid[revid] for revid in present])

    def get_determine_wants_revids(self, revids, include_tags=False):
        """Build a determine_wants callback for a set of bzr revision ids.

        :param revids: Revision ids, each translated to a git sha through
            the source repository
        :param include_tags: Passed on to get_determine_wants_heads
        :return: determine_wants callback
        """
        wants = set()
        for revid in set(revids):
            git_sha, mapping = self.source.lookup_bzr_revision_id(revid)
            wants.add(git_sha)
        return self.get_determine_wants_heads(wants, include_tags=include_tags)

    def fetch_objects(self, determine_wants, mapping, pb=None, limit=None):
        """Fetch objects from a remote server.

        :param determine_wants: determine_wants callback
        :param mapping: BzrGitMapping to use
        :param pb: Optional progress bar
        :param limit: Maximum number of commits to import.
        :return: Tuple with pack hint, last imported revision id and remote refs
        """
        raise NotImplementedError(self.fetch_objects)

    def fetch(self, revision_id=None, pb=None, find_ghosts=False,
              mapping=None, fetch_spec=None):
        """Fetch revisions from the source into the target.

        :param revision_id: Optional single revision id to fetch
        :param pb: Optional progress bar, handed to fetch_objects
        :param find_ghosts: Accepted for interface compatibility; not used
        :param mapping: Mapping to use; defaults to the source's mapping
        :param fetch_spec: Optional search result; only the "search" and
            "proxy-search" recipe types are supported
        :return: Dictionary with the remote refs
        """
        if mapping is None:
            mapping = self.source.get_mapping()
        if revision_id is not None:
            interesting_heads = [revision_id]
        elif fetch_spec is not None:
            recipe = fetch_spec.get_recipe()
            if recipe[0] in ("search", "proxy-search"):
                interesting_heads = recipe[1]
            else:
                raise AssertionError("Unsupported search result type %s" %
                        recipe[0])
        else:
            interesting_heads = None

        if interesting_heads is not None:
            determine_wants = self.get_determine_wants_revids(interesting_heads,
                include_tags=False)
        else:
            # Nothing specific was asked for: fetch everything.
            determine_wants = self.determine_wants_all

        (pack_hint, _, remote_refs) = self.fetch_objects(determine_wants,
            mapping, pb)
        if pack_hint is not None and self.target._format.pack_compresses:
            self.target.pack(hint=pack_hint)
        assert isinstance(remote_refs, dict)
        return remote_refs
0.200.225 by Jelmer Vernooij
Implement custom InterBranch to support fetching from remote git branches.
578
0.200.306 by Jelmer Vernooij
Fix tests, split up InterGitNonGitRepository.
579
0.200.563 by Jelmer Vernooij
Attempt to parse progress indication from git status reports.
580
_GIT_PROGRESS_RE = re.compile(r"(.*?): +(\d+)% \((\d+)/(\d+)\)")


def report_git_progress(pb, text):
    """Forward a line of git progress output to a progress bar.

    Lines of the form "<label>: <pct>% (<current>/<total>)" are reported
    as the label with the current and total counts; any other line is
    reported verbatim with both counts set to 0.

    :param pb: Progress bar to update
    :param text: Progress line; trailing CR/LF characters are dropped
    """
    message = text.rstrip("\r\n")
    match = _GIT_PROGRESS_RE.match(message)
    if match is None:
        pb.update(message, 0, 0)
        return
    # Groups are (label, percentage, current, total); the percentage is
    # implied by the two counts and is not forwarded.
    label, _pct, current, total = match.groups()
    pb.update(label, int(current), int(total))
589
590
0.200.1001 by Jelmer Vernooij
Simplify handling of determine wants, add stub for fetch_objects().
591
class DetermineWantsRecorder(object):
    """Wrap a determine_wants callback and remember what went through it.

    After a call, ``remote_refs`` holds the refs the callback was given
    and ``wants`` holds what it returned.
    """

    def __init__(self, actual):
        self.remote_refs = {}
        self.wants = []
        self.actual = actual

    def __call__(self, refs):
        # Record the refs first so they are kept even if the wrapped
        # callback raises.
        self.remote_refs = refs
        wanted = self.actual(refs)
        self.wants = wanted
        return wanted
602
603
0.200.306 by Jelmer Vernooij
Fix tests, split up InterGitNonGitRepository.
604
class InterRemoteGitNonGitRepository(InterGitNonGitRepository):
    """InterRepository that copies revisions from a remote Git into a non-Git
    repository."""

    def get_target_heads(self):
        """Return the target's revision ids that do not appear as a parent
        of any revision in the target's parent map."""
        # FIXME: This should be more efficient
        all_revs = self.target.all_revision_ids()
        parent_map = self.target.get_parent_map(all_revs)
        all_parents = set()
        # Explicit loop: map() must not be relied on for side effects, as
        # it does nothing when it is evaluated lazily.
        for parents in parent_map.itervalues():
            all_parents.update(parents)
        return set(all_revs) - all_parents

    def fetch_objects(self, determine_wants, mapping, pb=None, limit=None):
        """See `InterGitNonGitRepository`."""
        def progress(text):
            report_git_progress(pb, text)
        store = BazaarObjectStore(self.target, mapping)
        store.lock_write()
        try:
            heads = self.get_target_heads()
            graph_walker = store.get_graph_walker(
                    [store._lookup_revision_sha1(head) for head in heads])
            # Records the refs the source hands over and the wants chosen,
            # both of which are needed after the fetch.
            wants_recorder = DetermineWantsRecorder(determine_wants)

            create_pb = None
            if pb is None:
                # No bar supplied: create one, and finish it ourselves.
                create_pb = pb = ui.ui_factory.nested_progress_bar()
            try:
                objects_iter = self.source.fetch_objects(
                    wants_recorder, graph_walker, store.get_raw,
                    progress)
                trace.mutter("Importing %d new revisions",
                             len(wants_recorder.wants))
                (pack_hint, last_rev) = import_git_objects(self.target,
                    mapping, objects_iter, store, wants_recorder.wants, pb,
                    limit)
                return (pack_hint, last_rev, wants_recorder.remote_refs)
            finally:
                if create_pb:
                    create_pb.finished()
        finally:
            store.unlock()

    @staticmethod
    def is_compatible(source, target):
        """Be compatible with GitRepository."""
        if not isinstance(source, RemoteGitRepository):
            return False
        if not target.supports_rich_root():
            return False
        if isinstance(target, GitRepository):
            return False
        # Formats that do not declare the attribute are accepted.
        if not getattr(target._format, "supports_full_versioned_files", True):
            return False
        return True
0.200.306 by Jelmer Vernooij
Fix tests, split up InterGitNonGitRepository.
659
660
661
class InterLocalGitNonGitRepository(InterGitNonGitRepository):
    """InterRepository that copies revisions from a local Git into a non-Git
    repository."""

    def fetch_objects(self, determine_wants, mapping, pb=None, limit=None):
        """See `InterGitNonGitRepository`."""
        remote_refs = self.source._git.get_refs()
        wants = determine_wants(remote_refs)
        create_pb = None
        if pb is None:
            # No bar supplied: create one, and finish it ourselves.
            create_pb = pb = ui.ui_factory.nested_progress_bar()
        try:
            # Built inside the try so that the progress bar created above
            # is finished even when setting up the object store fails.
            target_git_object_retriever = BazaarObjectStore(self.target,
                mapping)
            target_git_object_retriever.lock_write()
            try:
                (pack_hint, last_rev) = import_git_objects(self.target,
                    mapping, self.source._git.object_store,
                    target_git_object_retriever, wants, pb, limit)
                return (pack_hint, last_rev, remote_refs)
            finally:
                target_git_object_retriever.unlock()
        finally:
            if create_pb:
                create_pb.finished()

    @staticmethod
    def is_compatible(source, target):
        """Be compatible with GitRepository."""
        if not isinstance(source, LocalGitRepository):
            return False
        if not target.supports_rich_root():
            return False
        if isinstance(target, GitRepository):
            return False
        # Formats that do not declare the attribute are accepted.
        if not getattr(target._format, "supports_full_versioned_files", True):
            return False
        return True
0.200.175 by Jelmer Vernooij
Add optimized handling when fetching from git to git.
698
699
0.200.456 by Jelmer Vernooij
Fix git -> git fetching.
700
class InterGitGitRepository(InterGitRepository):
0.200.291 by Jelmer Vernooij
Print proper error about not supporting push.
701
    """InterRepository that copies between Git repositories."""
0.200.175 by Jelmer Vernooij
Add optimized handling when fetching from git to git.
702
0.200.635 by Jelmer Vernooij
Fix fetching between git repositories.
703
    def fetch_objects(self, determine_wants, mapping, pb=None):
        """Copy objects from the source into the target Git repository.

        :param determine_wants: determine_wants callback
        :param mapping: Not used by this implementation
        :param pb: Not used by this implementation
        :return: Tuple (None, None, refs) with the refs reported by the
            fetch
        :raises NotImplementedError: for a local source with a remote
            target
        :raises AssertionError: for any other unsupported combination
        """
        def progress(text):
            trace.note("git: %s", text)

        graphwalker = self.target._git.get_graph_walker()
        source_is_local = isinstance(self.source, LocalGitRepository)
        target_is_local = isinstance(self.target, LocalGitRepository)

        if source_is_local and target_is_local:
            refs = self.source._git.fetch(
                self.target._git, determine_wants, progress)
            return (None, None, refs)

        if source_is_local and isinstance(self.target, RemoteGitRepository):
            raise NotImplementedError

        if not (isinstance(self.source, RemoteGitRepository) and
                target_is_local):
            raise AssertionError

        # Remote source, local target: receive the objects as a thin pack.
        f, commit = self.target._git.object_store.add_thin_pack()
        try:
            transport = self.source.bzrdir.root_transport
            refs = transport.fetch_pack(
                determine_wants, graphwalker, f.write, progress)
            commit()
            return (None, None, refs)
        except:
            f.close()
            raise
728
0.200.1154 by Jelmer Vernooij
Share more code in InterGitRepository.
729
    def _target_has_shas(self, shas):
730
        return set([sha for sha in shas if self.target._git.object_store])
731
0.200.940 by Jelmer Vernooij
Avoid confusion between different fetch functions with different semantics.
732
    def fetch(self, revision_id=None, pb=None, find_ghosts=False,
              mapping=None, fetch_spec=None, branches=None):
        """Fetch from the source Git repository into the target one.

        :param revision_id: Optional single revision id to fetch
        :param pb: Not used by this implementation
        :param find_ghosts: Not used by this implementation
        :param mapping: Mapping to use; defaults to the source's mapping
        :param fetch_spec: Optional search result; only the "search" and
            "proxy-search" recipe types are supported
        :param branches: Optional ref names; when given, exactly those
            refs are requested
        :return: The refs handed to the determine_wants callback
        """
        if mapping is None:
            mapping = self.source.get_mapping()
        target_git = self.target._git

        # Translate the requested revisions, if any, into git shas.
        if revision_id is not None:
            args = [mapping.revision_id_bzr_to_foreign(revision_id)[0]]
        elif fetch_spec is not None:
            recipe = fetch_spec.get_recipe()
            if recipe[0] not in ("search", "proxy-search"):
                raise AssertionError("Unsupported search result type %s" % recipe[0])
            heads = recipe[1]
            args = [mapping.revision_id_bzr_to_foreign(revid)[0] for revid in heads]

        def wants_from_branches(refs):
            # Shas of the named refs that the target lacks.
            wanted = []
            for branch in branches:
                sha = refs[branch]
                if sha not in target_git.object_store and sha != ZERO_SHA:
                    wanted.append(sha)
            return wanted

        def wants_from_args(refs):
            # Explicitly requested shas that the target lacks.
            wanted = []
            for sha in args:
                if sha not in target_git.object_store and sha != ZERO_SHA:
                    wanted.append(sha)
            return wanted

        if branches is not None:
            determine_wants = wants_from_branches
        elif fetch_spec is None and revision_id is None:
            determine_wants = self.determine_wants_all
        else:
            determine_wants = wants_from_args

        wants_recorder = DetermineWantsRecorder(determine_wants)
        self.fetch_objects(wants_recorder, mapping)
        return wants_recorder.remote_refs
0.200.175 by Jelmer Vernooij
Add optimized handling when fetching from git to git.
755
756
    @staticmethod
    def is_compatible(source, target):
        """Be compatible with GitRepository.

        :return: True only when both source and target are GitRepository
            instances
        """
        if not isinstance(source, GitRepository):
            return False
        return isinstance(target, GitRepository)
0.200.1174 by Jelmer Vernooij
Fix specific revision fetching between git repositories.
761
762
    def get_determine_wants_revids(self, revids, include_tags=False):
        """Build a determine_wants callback for a set of bzr revision ids.

        :param revids: Revision ids, each translated to a git sha through
            the source repository
        :param include_tags: Passed on to get_determine_wants_heads
        :return: determine_wants callback
        """
        lookup = self.source.lookup_bzr_revision_id
        git_shas = set()
        for bzr_revid in set(revids):
            # The lookup yields a (sha, mapping) pair; only the sha is used.
            sha, _unused_mapping = lookup(bzr_revid)
            git_shas.add(sha)
        return self.get_determine_wants_heads(
            git_shas, include_tags=include_tags)