/brz/remove-bazaar

To get this branch, use:
bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar
2520.4.85 by Aaron Bentley
Get all test passing (which just proves there aren't enough tests!)
1
# Copyright (C) 2007 Canonical Ltd
2
#
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
#
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
#
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
2520.4.20 by Aaron Bentley
Compress and base64-encode bundle contents
17
from cStringIO import StringIO
2520.4.26 by Aaron Bentley
Make decompression reasonably memory-efficient
18
import bz2
2520.4.130 by Aaron Bentley
Finish tweaking decode_name
19
import re
2520.4.20 by Aaron Bentley
Compress and base64-encode bundle contents
20
2520.4.13 by Aaron Bentley
Use real container implementation
21
from bzrlib import (
2520.4.40 by Aaron Bentley
Add human-readable diff to bundles
22
    diff,
2520.4.34 by Aaron Bentley
Add signature support
23
    errors,
2520.4.26 by Aaron Bentley
Make decompression reasonably memory-efficient
24
    iterablefile,
2520.4.13 by Aaron Bentley
Use real container implementation
25
    multiparent,
2520.4.97 by Aaron Bentley
Hack in support for inventory conversion
26
    osutils,
2520.4.13 by Aaron Bentley
Use real container implementation
27
    pack,
2520.4.40 by Aaron Bentley
Add human-readable diff to bundles
28
    revision as _mod_revision,
2520.4.45 by Aaron Bentley
Handle inconsistencies in last-modified-revision between vf and inventory
29
    trace,
2520.4.101 by Aaron Bentley
Use a registry to look up xml serializers by format
30
    xml_serializer,
2520.4.13 by Aaron Bentley
Use real container implementation
31
    )
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
32
from bzrlib.bundle import bundle_data, serializer
2520.4.56 by Aaron Bentley
Begin adding support for arbitrary metadata
33
from bzrlib.util import bencode
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
34
2520.4.4 by Aaron Bentley
Get basis support for a new bundle format in place
35
2520.4.25 by Aaron Bentley
Rename ContainerWriter/ContainerReader to BundleWriter/BundleReader
36
class BundleWriter(object):
2520.4.118 by Aaron Bentley
Add docs
37
    """Writer for bundle-format files.
38
39
    This serves roughly the same purpose as ContainerReader, but acts as a
40
    layer on top of it.
41
2520.4.123 by Aaron Bentley
Cleanup of bundle code
42
    Provides ways of writing the specific record types supported this bundle
2520.4.118 by Aaron Bentley
Add docs
43
    format.
44
    """
2520.4.123 by Aaron Bentley
Cleanup of bundle code
45
2520.4.23 by Aaron Bentley
Move responsability for encoding into container objects
46
    def __init__(self, fileobj):
2520.4.27 by Aaron Bentley
Use less memory when writing bzip-encoded files
47
        self._container = pack.ContainerWriter(self._write_encoded)
2520.4.23 by Aaron Bentley
Move responsability for encoding into container objects
48
        self._fileobj = fileobj
2520.4.27 by Aaron Bentley
Use less memory when writing bzip-encoded files
49
        self._compressor = bz2.BZ2Compressor()
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
50
2520.4.118 by Aaron Bentley
Add docs
51
    def _write_encoded(self, bytes):
52
        """Write bzip2-encoded bytes to the file"""
53
        self._fileobj.write(self._compressor.compress(bytes))
54
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
55
    def begin(self):
2520.4.118 by Aaron Bentley
Add docs
56
        """Start writing the bundle"""
2520.4.123 by Aaron Bentley
Cleanup of bundle code
57
        self._fileobj.write(serializer._get_bundle_header(
58
            serializer.v4_string))
2520.4.24 by Aaron Bentley
Move heading writing above container beginning
59
        self._fileobj.write('#\n')
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
60
        self._container.begin()
61
62
    def end(self):
2520.4.118 by Aaron Bentley
Add docs
63
        """Finish writing the bundle"""
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
64
        self._container.end()
2520.4.76 by Aaron Bentley
Move base64-encoding into merge directives
65
        self._fileobj.write(self._compressor.flush())
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
66
2520.4.60 by Aaron Bentley
Add sha1 verification for mpdiffs
67
    def add_multiparent_record(self, mp_bytes, sha1, parents, repo_kind,
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
68
                               revision_id, file_id):
2520.4.118 by Aaron Bentley
Add docs
69
        """Add a record for a multi-parent diff
70
71
        :mp_bytes: A multi-parent diff, as a bytestring
2520.4.123 by Aaron Bentley
Cleanup of bundle code
72
        :sha1: The sha1 hash of the fulltext
2520.4.118 by Aaron Bentley
Add docs
73
        :parents: a list of revision-ids of the parents
74
        :repo_kind: The kind of object in the repository.  May be 'file' or
75
            'inventory'
76
        :revision_id: The revision id of the mpdiff being added.
77
        :file_id: The file-id of the file, or None for inventories.
78
        """
2520.4.60 by Aaron Bentley
Add sha1 verification for mpdiffs
79
        metadata = {'parents': parents,
80
                    'storage_kind': 'mpdiff',
81
                    'sha1': sha1}
82
        self._add_record(mp_bytes, metadata, repo_kind, revision_id, file_id)
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
83
2520.4.123 by Aaron Bentley
Cleanup of bundle code
84
    def add_fulltext_record(self, bytes, parents, repo_kind, revision_id):
2520.4.118 by Aaron Bentley
Add docs
85
        """Add a record for a fulltext
86
87
        :bytes: The fulltext, as a bytestring
88
        :parents: a list of revision-ids of the parents
89
        :repo_kind: The kind of object in the repository.  May be 'revision' or
90
            'signature'
91
        :revision_id: The revision id of the fulltext being added.
92
        """
93
        metadata = {'parents': parents,
2520.5.3 by Aaron Bentley
fix sha1 in bundle format 4
94
                    'storage_kind': 'mpdiff'}
2520.4.60 by Aaron Bentley
Add sha1 verification for mpdiffs
95
        self._add_record(bytes, {'parents': parents,
2520.4.123 by Aaron Bentley
Cleanup of bundle code
96
            'storage_kind': 'fulltext'}, repo_kind, revision_id, None)
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
97
2520.4.95 by Aaron Bentley
Add support for header/info records
98
    def add_info_record(self, **kwargs):
2520.4.118 by Aaron Bentley
Add docs
99
        """Add an info record to the bundle
100
101
        Any parameters may be supplied, except 'self' and 'storage_kind'.
102
        Values must be lists, strings, integers, dicts, or a combination.
103
        """
2520.4.95 by Aaron Bentley
Add support for header/info records
104
        kwargs['storage_kind'] = 'header'
105
        self._add_record(None, kwargs, 'info', None, None)
106
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
107
    @staticmethod
2520.4.68 by Aaron Bentley
Change name separators to all-slash
108
    def encode_name(content_kind, revision_id, file_id=None):
2520.4.118 by Aaron Bentley
Add docs
109
        """Encode semantic ids as a container name"""
2520.4.95 by Aaron Bentley
Add support for header/info records
110
        assert content_kind in ('revision', 'file', 'inventory', 'signature',
111
                                'info')
2520.4.118 by Aaron Bentley
Add docs
112
113
        if content_kind == 'file':
114
            assert file_id is not None
115
        else:
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
116
            assert file_id is None
2520.4.95 by Aaron Bentley
Add support for header/info records
117
        if content_kind == 'info':
118
            assert revision_id is None
119
        else:
120
            assert revision_id is not None
2520.4.127 by Aaron Bentley
Fix up name encoding to handle revision-ids with slashes
121
        names = [n.replace('/', '//') for n in
122
                 (content_kind, revision_id, file_id) if n is not None]
2520.4.68 by Aaron Bentley
Change name separators to all-slash
123
        return '/'.join(names)
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
124
2520.4.56 by Aaron Bentley
Begin adding support for arbitrary metadata
125
    def _add_record(self, bytes, metadata, repo_kind, revision_id, file_id):
2520.4.118 by Aaron Bentley
Add docs
126
        """Add a bundle record to the container.
127
128
        Most bundle records are recorded as header/body pairs, with the
129
        body being nameless.  Records with storage_kind 'header' have no
130
        body.
131
        """
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
132
        name = self.encode_name(repo_kind, revision_id, file_id)
2520.4.95 by Aaron Bentley
Add support for header/info records
133
        encoded_metadata = bencode.bencode(metadata)
2682.1.1 by Robert Collins
* The ``bzrlib.pack`` interface has changed to use tuples of bytestrings
134
        self._container.add_bytes_record(encoded_metadata, [(name, )])
2520.4.95 by Aaron Bentley
Add support for header/info records
135
        if metadata['storage_kind'] != 'header':
136
            self._container.add_bytes_record(bytes, [])
2520.4.13 by Aaron Bentley
Use real container implementation
137
2520.4.7 by Aaron Bentley
Fix patch deserialization
138
2520.4.25 by Aaron Bentley
Rename ContainerWriter/ContainerReader to BundleWriter/BundleReader
139
class BundleReader(object):
2520.4.118 by Aaron Bentley
Add docs
140
    """Reader for bundle-format files.
141
142
    This serves roughly the same purpose as ContainerReader, but acts as a
143
    layer on top of it, providing metadata, a semantic name, and a record
144
    body
145
    """
2520.4.123 by Aaron Bentley
Cleanup of bundle code
146
2520.4.148 by Aaron Bentley
Updates from review
147
    def __init__(self, fileobj, stream_input=True):
2520.4.145 by Aaron Bentley
Add memory_friendly toggle, be memory-unfriendly for merge directives
148
        """Constructor
149
150
        :param fileobj: a file containing a bzip-encoded container
2520.4.148 by Aaron Bentley
Updates from review
151
        :param stream_input: If True, the BundleReader stream input rather than
152
            reading it all into memory at once.  Reading it into memory all at
153
            once is (currently) faster.
2520.4.145 by Aaron Bentley
Add memory_friendly toggle, be memory-unfriendly for merge directives
154
        """
2520.4.23 by Aaron Bentley
Move responsability for encoding into container objects
155
        line = fileobj.readline()
156
        if line != '\n':
157
            fileobj.readline()
2520.4.40 by Aaron Bentley
Add human-readable diff to bundles
158
        self.patch_lines = []
2520.4.148 by Aaron Bentley
Updates from review
159
        if stream_input:
2520.4.145 by Aaron Bentley
Add memory_friendly toggle, be memory-unfriendly for merge directives
160
            source_file = iterablefile.IterableFile(self.iter_decode(fileobj))
161
        else:
162
            source_file = StringIO(bz2.decompress(fileobj.read()))
2916.2.18 by Andrew Bennetts
Use iter_records_from_file rather than ContainerReader.
163
        self._container_file = source_file
2520.4.26 by Aaron Bentley
Make decompression reasonably memory-efficient
164
165
    @staticmethod
166
    def iter_decode(fileobj):
2520.4.118 by Aaron Bentley
Add docs
167
        """Iterate through decoded fragments of the file"""
2520.4.26 by Aaron Bentley
Make decompression reasonably memory-efficient
168
        decompressor = bz2.BZ2Decompressor()
169
        for line in fileobj:
2916.2.18 by Andrew Bennetts
Use iter_records_from_file rather than ContainerReader.
170
            try:
171
                yield decompressor.decompress(line)
172
            except EOFError:
173
                return
2520.4.22 by Aaron Bentley
Create ContainerReader
174
175
    @staticmethod
176
    def decode_name(name):
2520.4.118 by Aaron Bentley
Add docs
177
        """Decode a name from its container form into a semantic form
178
179
        :retval: content_kind, revision_id, file_id
180
        """
2520.4.130 by Aaron Bentley
Finish tweaking decode_name
181
        segments = re.split('(//?)', name)
182
        names = ['']
2520.4.127 by Aaron Bentley
Fix up name encoding to handle revision-ids with slashes
183
        for segment in segments:
184
            if segment == '//':
185
                names[-1] += '/'
2520.4.130 by Aaron Bentley
Finish tweaking decode_name
186
            elif segment == '/':
2520.4.127 by Aaron Bentley
Fix up name encoding to handle revision-ids with slashes
187
                names.append('')
188
            else:
189
                names[-1] += segment
2520.4.130 by Aaron Bentley
Finish tweaking decode_name
190
        content_kind = names[0]
2520.4.95 by Aaron Bentley
Add support for header/info records
191
        revision_id = None
192
        file_id = None
193
        if len(names) > 1:
194
            revision_id = names[1]
2520.4.68 by Aaron Bentley
Change name separators to all-slash
195
        if len(names) > 2:
196
            file_id = names[2]
197
        return content_kind, revision_id, file_id
2520.4.22 by Aaron Bentley
Create ContainerReader
198
199
    def iter_records(self):
2520.4.118 by Aaron Bentley
Add docs
200
        """Iterate through bundle records
201
202
        :return: a generator of (bytes, metadata, content_kind, revision_id,
203
            file_id)
204
        """
2916.2.18 by Andrew Bennetts
Use iter_records_from_file rather than ContainerReader.
205
        iterator = pack.iter_records_from_file(self._container_file)
206
        for names, bytes in iterator:
2520.4.131 by Aaron Bentley
Raise BadBundle for records with wrong number of names
207
            if len(names) != 1:
208
                raise errors.BadBundle('Record has %d names instead of 1'
209
                                       % len(names))
2916.2.18 by Andrew Bennetts
Use iter_records_from_file rather than ContainerReader.
210
            metadata = bencode.bdecode(bytes)
2520.4.95 by Aaron Bentley
Add support for header/info records
211
            if metadata['storage_kind'] == 'header':
212
                bytes = None
213
            else:
214
                _unused, bytes = iterator.next()
2682.1.1 by Robert Collins
* The ``bzrlib.pack`` interface has changed to use tuples of bytestrings
215
            yield (bytes, metadata) + self.decode_name(names[0][0])
2520.4.22 by Aaron Bentley
Create ContainerReader
216
217
2520.4.72 by Aaron Bentley
Rename format to 4alpha
218
class BundleSerializerV4(serializer.BundleSerializer):
2520.4.118 by Aaron Bentley
Add docs
219
    """Implement the high-level bundle interface"""
2520.4.123 by Aaron Bentley
Cleanup of bundle code
220
2520.4.4 by Aaron Bentley
Get basis support for a new bundle format in place
221
    def write(self, repository, revision_ids, forced_bases, fileobj):
2520.4.118 by Aaron Bentley
Add docs
222
        """Write a bundle to a file-like object
223
224
        For backwards-compatibility only
225
        """
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
226
        write_op = BundleWriteOperation.from_old_args(repository, revision_ids,
227
                                                      forced_bases, fileobj)
2520.4.53 by Aaron Bentley
refactor bundle serialization to make write_bundle primary
228
        return write_op.do_write()
229
230
    def write_bundle(self, repository, target, base, fileobj):
2520.4.118 by Aaron Bentley
Add docs
231
        """Write a bundle to a file object
232
233
        :param repository: The repository to retrieve revision data from
234
        :param target: The head revision to include ancestors of
235
        :param base: The ancestor of the target to stop including acestors
236
            at.
237
        :param fileobj: The file-like object to write to
238
        """
2520.4.53 by Aaron Bentley
refactor bundle serialization to make write_bundle primary
239
        write_op =  BundleWriteOperation(base, target, repository, fileobj)
240
        return write_op.do_write()
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
241
242
    def read(self, file):
2520.4.118 by Aaron Bentley
Add docs
243
        """return a reader object for a given file"""
2520.4.72 by Aaron Bentley
Rename format to 4alpha
244
        bundle = BundleInfoV4(file, self)
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
245
        return bundle
246
2520.4.101 by Aaron Bentley
Use a registry to look up xml serializers by format
247
    @staticmethod
248
    def get_source_serializer(info):
2520.4.118 by Aaron Bentley
Add docs
249
        """Retrieve the serializer for a given info object"""
2520.4.101 by Aaron Bentley
Use a registry to look up xml serializers by format
250
        return xml_serializer.format_registry.get(info['serializer'])
251
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
252
253
class BundleWriteOperation(object):
2520.4.118 by Aaron Bentley
Add docs
254
    """Perform the operation of writing revisions to a bundle"""
2520.4.123 by Aaron Bentley
Cleanup of bundle code
255
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
256
    @classmethod
257
    def from_old_args(cls, repository, revision_ids, forced_bases, fileobj):
2520.4.123 by Aaron Bentley
Cleanup of bundle code
258
        """Create a BundleWriteOperation from old-style arguments"""
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
259
        base, target = cls.get_base_target(revision_ids, forced_bases,
260
                                           repository)
261
        return BundleWriteOperation(base, target, repository, fileobj,
262
                                    revision_ids)
263
2520.4.53 by Aaron Bentley
refactor bundle serialization to make write_bundle primary
264
    def __init__(self, base, target, repository, fileobj, revision_ids=None):
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
265
        self.base = base
266
        self.target = target
267
        self.repository = repository
2520.4.39 by Aaron Bentley
Rename container => bundle(reader) where appropriate
268
        bundle = BundleWriter(fileobj)
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
269
        self.bundle = bundle
2520.4.64 by Aaron Bentley
Avoid topo sort for v10 bundles
270
        self.base_ancestry = set(repository.get_ancestry(base,
271
                                                         topo_sorted=False))
2520.4.53 by Aaron Bentley
refactor bundle serialization to make write_bundle primary
272
        if revision_ids is not None:
273
            self.revision_ids = revision_ids
274
        else:
2520.4.64 by Aaron Bentley
Avoid topo sort for v10 bundles
275
            revision_ids = set(repository.get_ancestry(target,
276
                                                       topo_sorted=False))
2520.4.55 by Aaron Bentley
Fix file revision selection to grab all dependencies properly
277
            self.revision_ids = revision_ids.difference(self.base_ancestry)
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
278
279
    def do_write(self):
2520.4.118 by Aaron Bentley
Add docs
280
        """Write all data to the bundle"""
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
281
        self.bundle.begin()
2520.4.97 by Aaron Bentley
Hack in support for inventory conversion
282
        self.write_info()
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
283
        self.write_files()
284
        self.write_revisions()
285
        self.bundle.end()
2520.4.53 by Aaron Bentley
refactor bundle serialization to make write_bundle primary
286
        return self.revision_ids
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
287
2520.4.97 by Aaron Bentley
Hack in support for inventory conversion
288
    def write_info(self):
2520.4.118 by Aaron Bentley
Add docs
289
        """Write format info"""
2520.4.113 by Aaron Bentley
Avoid peeking at Repository._serializer
290
        serializer_format = self.repository.get_serializer_format()
2520.4.99 by Aaron Bentley
Test conversion across models
291
        supports_rich_root = {True: 1, False: 0}[
292
            self.repository.supports_rich_root()]
2520.4.113 by Aaron Bentley
Avoid peeking at Repository._serializer
293
        self.bundle.add_info_record(serializer=serializer_format,
2520.4.99 by Aaron Bentley
Test conversion across models
294
                                    supports_rich_root=supports_rich_root)
2520.4.97 by Aaron Bentley
Hack in support for inventory conversion
295
2520.4.51 by Aaron Bentley
Split iteration through file revisions into a method, so we can vary it
296
    def iter_file_revisions(self):
2520.4.118 by Aaron Bentley
Add docs
297
        """Iterate through all relevant revisions of all files.
2520.4.51 by Aaron Bentley
Split iteration through file revisions into a method, so we can vary it
298
2520.4.118 by Aaron Bentley
Add docs
299
        This is the correct implementation, but is not compatible with bzr.dev,
300
        because certain old revisions were not converted correctly, and have
301
        the wrong "revision" marker in inventories.
2520.4.51 by Aaron Bentley
Split iteration through file revisions into a method, so we can vary it
302
        """
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
303
        transaction = self.repository.get_transaction()
304
        altered = self.repository.fileids_altered_by_revision_ids(
305
            self.revision_ids)
2520.4.6 by Aaron Bentley
Get installation started
306
        for file_id, file_revision_ids in altered.iteritems():
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
307
            vf = self.repository.weave_store.get_weave(file_id, transaction)
2520.4.51 by Aaron Bentley
Split iteration through file revisions into a method, so we can vary it
308
            yield vf, file_id, file_revision_ids
309
2520.4.55 by Aaron Bentley
Fix file revision selection to grab all dependencies properly
310
    def iter_file_revisions_aggressive(self):
2520.4.118 by Aaron Bentley
Add docs
311
        """Iterate through all relevant revisions of all files.
2520.4.55 by Aaron Bentley
Fix file revision selection to grab all dependencies properly
312
313
        This uses the standard iter_file_revisions to determine what revisions
314
        are referred to by inventories, but then uses the versionedfile to
315
        determine what the build-dependencies of each required revision.
316
317
        All build dependencies which are not ancestors of the base revision
318
        are emitted.
319
        """
320
        for vf, file_id, file_revision_ids in self.iter_file_revisions():
321
            new_revision_ids = set()
322
            pending = list(file_revision_ids)
323
            while len(pending) > 0:
324
                revision_id = pending.pop()
325
                if revision_id in new_revision_ids:
326
                    continue
327
                if revision_id in self.base_ancestry:
328
                    continue
329
                new_revision_ids.add(revision_id)
330
                pending.extend(vf.get_parents(revision_id))
331
            yield vf, file_id, new_revision_ids
332
2520.4.51 by Aaron Bentley
Split iteration through file revisions into a method, so we can vary it
333
    def write_files(self):
2520.4.118 by Aaron Bentley
Add docs
334
        """Write bundle records for all revisions of all files"""
2745.6.11 by Aaron Bentley
Fix knit file parents to follow parentage from revision/inventory XML
335
        for vf, file_id, revision_ids in self.iter_file_revisions():
2520.4.51 by Aaron Bentley
Split iteration through file revisions into a method, so we can vary it
336
            self.add_mp_records('file', file_id, vf, revision_ids)
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
337
338
    def write_revisions(self):
2520.4.118 by Aaron Bentley
Add docs
339
        """Write bundle records for all revisions and signatures"""
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
340
        inv_vf = self.repository.get_inventory_weave()
341
        revision_order = list(multiparent.topo_iter(inv_vf, self.revision_ids))
2520.4.75 by Aaron Bentley
Fix traceback on empty bundles.
342
        if self.target is not None and self.target in self.revision_ids:
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
343
            revision_order.remove(self.target)
344
            revision_order.append(self.target)
345
        self.add_mp_records('inventory', None, inv_vf, revision_order)
2520.4.114 by Aaron Bentley
Avoid deprecated method get_parent_names method
346
        parents_list = self.repository.get_parents(revision_order)
347
        for parents, revision_id in zip(parents_list, revision_order):
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
348
            revision_text = self.repository.get_revision_xml(revision_id)
349
            self.bundle.add_fulltext_record(revision_text, parents,
2520.4.123 by Aaron Bentley
Cleanup of bundle code
350
                                       'revision', revision_id)
2520.4.34 by Aaron Bentley
Add signature support
351
            try:
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
352
                self.bundle.add_fulltext_record(
353
                    self.repository.get_signature_text(
2520.4.123 by Aaron Bentley
Cleanup of bundle code
354
                    revision_id), parents, 'signature', revision_id)
2520.4.34 by Aaron Bentley
Add signature support
355
            except errors.NoSuchRevision:
356
                pass
357
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
358
    @staticmethod
359
    def get_base_target(revision_ids, forced_bases, repository):
2520.4.123 by Aaron Bentley
Cleanup of bundle code
360
        """Determine the base and target from old-style revision ids"""
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
361
        if len(revision_ids) == 0:
362
            return None, None
363
        target = revision_ids[0]
364
        base = forced_bases.get(target)
365
        if base is None:
366
            parents = repository.get_revision(target).parent_ids
367
            if len(parents) == 0:
368
                base = _mod_revision.NULL_REVISION
369
            else:
370
                base = parents[0]
371
        return base, target
372
373
    def add_mp_records(self, repo_kind, file_id, vf, revision_ids):
2520.4.118 by Aaron Bentley
Add docs
374
        """Add multi-parent diff records to a bundle"""
2520.4.41 by Aaron Bentley
Accelerate mpdiff generation
375
        revision_ids = list(multiparent.topo_iter(vf, revision_ids))
376
        mpdiffs = vf.make_mpdiffs(revision_ids)
2520.4.88 by Aaron Bentley
Retrieve all sha1s at once (ftw)
377
        sha1s = vf.get_sha1s(revision_ids)
378
        for mpdiff, revision_id, sha1, in zip(mpdiffs, revision_ids, sha1s):
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
379
            parents = vf.get_parents(revision_id)
2520.4.41 by Aaron Bentley
Accelerate mpdiff generation
380
            text = ''.join(mpdiff.to_patch())
2520.4.60 by Aaron Bentley
Add sha1 verification for mpdiffs
381
            self.bundle.add_multiparent_record(text, sha1, parents, repo_kind,
2520.4.50 by Aaron Bentley
Split write functionality out into a separate object
382
                                               revision_id, file_id)
2520.4.6 by Aaron Bentley
Get installation started
383
384
2520.4.72 by Aaron Bentley
Rename format to 4alpha
385
class BundleInfoV4(object):
2520.4.6 by Aaron Bentley
Get installation started
386
2520.4.118 by Aaron Bentley
Add docs
387
    """Provide (most of) the BundleInfo interface"""
2520.4.6 by Aaron Bentley
Get installation started
388
    def __init__(self, fileobj, serializer):
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
389
        self._fileobj = fileobj
390
        self._serializer = serializer
391
        self.__real_revisions = None
392
        self.__revisions = None
393
394
    def install(self, repository):
395
        return self.install_revisions(repository)
396
2520.4.148 by Aaron Bentley
Updates from review
397
    def install_revisions(self, repository, stream_input=True):
398
        """Install this bundle's revisions into the specified repository
399
400
        :param target_repo: The repository to install into
401
        :param stream_input: If True, will stream input rather than reading it
402
            all into memory at once.  Reading it into memory all at once is
403
            (currently) faster.
404
        """
2520.4.18 by Aaron Bentley
Generate mpdiffs for inventory
405
        repository.lock_write()
406
        try:
2520.4.148 by Aaron Bentley
Updates from review
407
            ri = RevisionInstaller(self.get_bundle_reader(stream_input),
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
408
                                   self._serializer, repository)
2520.4.18 by Aaron Bentley
Generate mpdiffs for inventory
409
            return ri.install()
410
        finally:
411
            repository.unlock()
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
412
2520.4.109 by Aaron Bentley
start work on directive cherry-picking
413
    def get_merge_request(self, target_repo):
414
        """Provide data for performing a merge
415
416
        Returns suggested base, suggested target, and patch verification status
417
        """
418
        return None, self.target, 'inapplicable'
419
2520.4.148 by Aaron Bentley
Updates from review
420
    def get_bundle_reader(self, stream_input=True):
421
        """Return a new BundleReader for the associated bundle
422
423
        :param stream_input: If True, the BundleReader stream input rather than
424
            reading it all into memory at once.  Reading it into memory all at
425
            once is (currently) faster.
426
        """
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
427
        self._fileobj.seek(0)
2520.4.148 by Aaron Bentley
Updates from review
428
        return BundleReader(self._fileobj, stream_input)
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
429
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
430
    def _get_real_revisions(self):
431
        if self.__real_revisions is None:
432
            self.__real_revisions = []
2520.4.39 by Aaron Bentley
Rename container => bundle(reader) where appropriate
433
            bundle_reader = self.get_bundle_reader()
2520.4.102 by Aaron Bentley
rename parents to metadata
434
            for bytes, metadata, repo_kind, revision_id, file_id in \
2520.4.39 by Aaron Bentley
Rename container => bundle(reader) where appropriate
435
                bundle_reader.iter_records():
2520.4.101 by Aaron Bentley
Use a registry to look up xml serializers by format
436
                if repo_kind == 'info':
437
                    serializer =\
2520.4.102 by Aaron Bentley
rename parents to metadata
438
                        self._serializer.get_source_serializer(metadata)
2520.4.22 by Aaron Bentley
Create ContainerReader
439
                if repo_kind == 'revision':
2520.4.101 by Aaron Bentley
Use a registry to look up xml serializers by format
440
                    rev = serializer.read_revision_from_string(bytes)
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
441
                    self.__real_revisions.append(rev)
442
        return self.__real_revisions
443
    real_revisions = property(_get_real_revisions)
444
445
    def _get_revisions(self):
446
        if self.__revisions is None:
447
            self.__revisions = []
448
            for revision in self.real_revisions:
2520.4.33 by Aaron Bentley
remove test dependencies on serialization minutia
449
                self.__revisions.append(
450
                    bundle_data.RevisionInfo.from_revision(revision))
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
451
        return self.__revisions
452
453
    revisions = property(_get_revisions)
454
2520.4.29 by Aaron Bentley
Reactivate some testing, fix topo_iter
455
    def _get_target(self):
456
        return self.revisions[-1].revision_id
457
458
    target = property(_get_target)
459
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
460
461
class RevisionInstaller(object):
2520.4.123 by Aaron Bentley
Cleanup of bundle code
462
    """Installs revisions into a repository"""
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
463
2520.4.21 by Aaron Bentley
Finish turning ContainerWriter into a new layer
464
    def __init__(self, container, serializer, repository):
465
        self._container = container
2520.4.6 by Aaron Bentley
Get installation started
466
        self._serializer = serializer
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
467
        self._repository = repository
2520.4.97 by Aaron Bentley
Hack in support for inventory conversion
468
        self._info = None
2520.4.99 by Aaron Bentley
Test conversion across models
469
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
470
    def install(self):
2592.4.1 by Martin Pool
RevisionInstaller now creates a write group for its work
471
        """Perform the installation.
472
        
473
        Must be called with the Repository locked.
474
        """
475
        self._repository.start_write_group()
476
        try:
2856.1.2 by Robert Collins
Review feedback.
477
            result = self._install_in_write_group()
2592.4.1 by Martin Pool
RevisionInstaller now creates a write group for its work
478
        except:
479
            self._repository.abort_write_group()
480
            raise
481
        self._repository.commit_write_group()
482
        return result
483
2856.1.2 by Robert Collins
Review feedback.
484
    def _install_in_write_group(self):
2520.4.6 by Aaron Bentley
Get installation started
485
        current_file = None
486
        current_versionedfile = None
487
        pending_file_records = []
2520.4.142 by Aaron Bentley
Clean up installation of inventory records
488
        inventory_vf = None
489
        pending_inventory_records = []
2520.4.8 by Aaron Bentley
Serialize inventory
490
        added_inv = set()
2520.4.29 by Aaron Bentley
Reactivate some testing, fix topo_iter
491
        target_revision = None
2520.4.58 by Aaron Bentley
Propogate support for metadata to iter_revisions, add storage kind
492
        for bytes, metadata, repo_kind, revision_id, file_id in\
2520.4.22 by Aaron Bentley
Create ContainerReader
493
            self._container.iter_records():
2520.4.97 by Aaron Bentley
Hack in support for inventory conversion
494
            if repo_kind == 'info':
495
                assert self._info is None
2520.4.123 by Aaron Bentley
Cleanup of bundle code
496
                self._handle_info(metadata)
2520.6.2 by Aaron Bentley
Fix bundle installation wrong-versionedfile bug
497
            if (repo_kind, file_id) != ('file', current_file):
498
                if len(pending_file_records) > 0:
499
                    self._install_mp_records(current_versionedfile,
500
                                             pending_file_records)
2520.4.8 by Aaron Bentley
Serialize inventory
501
                current_file = None
502
                current_versionedfile = None
503
                pending_file_records = []
2520.4.142 by Aaron Bentley
Clean up installation of inventory records
504
            if len(pending_inventory_records) > 0 and repo_kind != 'inventory':
505
                self._install_inventory_records(inventory_vf,
506
                                                pending_inventory_records)
507
                pending_inventory_records = []
508
            if repo_kind == 'inventory':
509
                if inventory_vf is None:
510
                    inventory_vf = self._repository.get_inventory_weave()
511
                if revision_id not in inventory_vf:
512
                    pending_inventory_records.append((revision_id, metadata,
513
                                                      bytes))
514
            if repo_kind == 'revision':
515
                target_revision = revision_id
516
                self._install_revision(revision_id, metadata, bytes)
517
            if repo_kind == 'signature':
518
                self._install_signature(revision_id, metadata, bytes)
2520.4.22 by Aaron Bentley
Create ContainerReader
519
            if repo_kind == 'file':
2520.4.142 by Aaron Bentley
Clean up installation of inventory records
520
                current_file = file_id
521
                if current_versionedfile is None:
2520.4.6 by Aaron Bentley
Get installation started
522
                    current_versionedfile = \
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
523
                        self._repository.weave_store.get_weave_or_empty(
524
                        file_id, self._repository.get_transaction())
2520.4.6 by Aaron Bentley
Get installation started
525
                    pending_file_records = []
526
                if revision_id in current_versionedfile:
527
                    continue
2520.4.59 by Aaron Bentley
Push metadata down the stack
528
                pending_file_records.append((revision_id, metadata, bytes))
2520.4.18 by Aaron Bentley
Generate mpdiffs for inventory
529
        self._install_mp_records(current_versionedfile, pending_file_records)
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
530
        return target_revision
2520.4.6 by Aaron Bentley
Get installation started
531
2520.4.123 by Aaron Bentley
Cleanup of bundle code
532
    def _handle_info(self, info):
533
        """Extract data from an info record"""
534
        self._info = info
535
        self._source_serializer = self._serializer.get_source_serializer(info)
536
        if (info['supports_rich_root'] == 0 and
537
            self._repository.supports_rich_root()):
538
            self.update_root = True
539
        else:
540
            self.update_root = False
541
2520.4.60 by Aaron Bentley
Add sha1 verification for mpdiffs
542
    def _install_mp_records(self, versionedfile, records):
2520.4.61 by Aaron Bentley
Do bulk insertion of records
543
        if len(records) == 0:
544
            return
545
        d_func = multiparent.MultiParent.from_patch
546
        vf_records = [(r, m['parents'], m['sha1'], d_func(t)) for r, m, t in
547
                      records if r not in versionedfile]
548
        versionedfile.add_mpdiffs(vf_records)
2520.4.8 by Aaron Bentley
Serialize inventory
549
2520.4.142 by Aaron Bentley
Clean up installation of inventory records
550
    def _install_inventory_records(self, vf, records):
2520.4.97 by Aaron Bentley
Hack in support for inventory conversion
551
        if self._info['serializer'] == self._repository._serializer.format_num:
2520.4.142 by Aaron Bentley
Clean up installation of inventory records
552
            return self._install_mp_records(vf, records)
553
        for revision_id, metadata, bytes in records:
554
            parent_ids = metadata['parents']
555
            parents = [self._repository.get_inventory(p)
556
                       for p in parent_ids]
557
            p_texts = [self._source_serializer.write_inventory_to_string(p)
558
                       for p in parents]
559
            target_lines = multiparent.MultiParent.from_patch(bytes).to_lines(
560
                p_texts)
561
            sha1 = osutils.sha_strings(target_lines)
562
            if sha1 != metadata['sha1']:
563
                raise errors.BadBundle("Can't convert to target format")
564
            target_inv = self._source_serializer.read_inventory_from_string(
565
                ''.join(target_lines))
566
            self._handle_root(target_inv, parent_ids)
567
            try:
568
                self._repository.add_inventory(revision_id, target_inv,
569
                                               parent_ids)
570
            except errors.UnsupportedInventoryKind:
571
                raise errors.IncompatibleRevision(repr(self._repository))
2520.4.99 by Aaron Bentley
Test conversion across models
572
573
    def _handle_root(self, target_inv, parent_ids):
574
        revision_id = target_inv.revision_id
575
        if self.update_root:
576
            target_inv.root.revision = revision_id
577
            store = self._repository.weave_store
578
            transaction = self._repository.get_transaction()
579
            vf = store.get_weave_or_empty(target_inv.root.file_id, transaction)
580
            vf.add_lines(revision_id, parent_ids, [])
581
        elif not self._repository.supports_rich_root():
582
            if target_inv.root.revision != revision_id:
583
                raise errors.IncompatibleRevision(repr(self._repository))
584
2520.4.10 by Aaron Bentley
Enable installation of revisions
585
2520.4.59 by Aaron Bentley
Push metadata down the stack
586
    def _install_revision(self, revision_id, metadata, text):
2520.4.14 by Aaron Bentley
Get most tests passing, use format header
587
        if self._repository.has_revision(revision_id):
588
            return
589
        self._repository._add_revision_text(revision_id, text)
2520.4.34 by Aaron Bentley
Add signature support
590
2520.4.59 by Aaron Bentley
Push metadata down the stack
591
    def _install_signature(self, revision_id, metadata, text):
2520.4.100 by Aaron Bentley
Fix repeat signature installs
592
        transaction = self._repository.get_transaction()
593
        if self._repository._revision_store.has_signature(revision_id,
594
                                                          transaction):
595
            return
2520.4.34 by Aaron Bentley
Add signature support
596
        self._repository._revision_store.add_revision_signature_text(
2520.4.100 by Aaron Bentley
Fix repeat signature installs
597
            revision_id, text, transaction)