/brz/remove-bazaar

To get this branch, use:
bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar
485 by Martin Pool
- move commit code into its own module
1
# Copyright (C) 2005 Canonical Ltd
1248 by Martin Pool
- new weave based cleanup [broken]
2
#
485 by Martin Pool
- move commit code into its own module
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
1248 by Martin Pool
- new weave based cleanup [broken]
7
#
485 by Martin Pool
- move commit code into its own module
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
1248 by Martin Pool
- new weave based cleanup [broken]
12
#
485 by Martin Pool
- move commit code into its own module
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
17
1248 by Martin Pool
- new weave based cleanup [broken]
18
# XXX: Can we do any better about making interrupted commits change
19
# nothing?  Perhaps the best approach is to integrate commit of
20
# AtomicFiles with releasing the lock on the Branch.
21
22
# TODO: Separate 'prepare' phase where we find a list of potentially
23
# committed files.  We can then pause the commit to prompt for a
24
# commit message, knowing the summary will be the same as what's
25
# actually used for the commit.  (But perhaps simpler to simply get
26
# the tree status, then use that for a selective commit?)
27
28
# The newly committed revision is going to have a shape corresponding
29
# to that of the working inventory.  Files that are not in the
30
# working tree and that were in the predecessor are reported as
31
# removed --- this can include files that were either removed from the
32
# inventory or deleted in the working tree.  If they were only
33
# deleted from disk, they are removed from the working inventory.
34
35
# We then consider the remaining entries, which will be in the new
36
# version.  Directory entries are simply copied across.  File entries
37
# must be checked to see if a new version of the file should be
38
# recorded.  For each parent revision inventory, we check to see what
39
# version of the file was present.  If the file was present in at
40
# least one tree, and if it was the same version in all the trees,
41
# then we can just refer to that version.  Otherwise, a new version
42
# representing the merger of the file versions must be added.
43
44
# TODO: Update hashcache before and after - or does the WorkingTree
45
# look after that?
1245 by Martin Pool
doc
46
1264 by Martin Pool
- Raise a better error from commit when a parent is absent
47
# This code requires all merge parents to be present in the branch.
48
# We could relax this but for the sake of simplicity the constraint is
49
# here for now.  It's not totally clear to me how we'd know which files
50
# need new text versions if some parents are absent.  -- mbp 20050915
1194 by Martin Pool
- [BROKEN] more progress of commit into weaves
51
1339 by Martin Pool
- doc
52
# TODO: Rather than mashing together the ancestry and storing it back,
53
# perhaps the weave should have a single method which does it all in one
54
# go, avoiding a lot of redundant work.
1335 by Martin Pool
doc
55
1341 by Martin Pool
- doc
56
# TODO: Perhaps give a warning if one of the revisions marked as
57
# merged is already in the ancestry, and then don't record it as a
58
# distinct parent.
59
1343 by Martin Pool
- fix up test for merge of trees
60
# TODO: If the file is newly merged but unchanged from the version it
61
# merges from, then it should still be reported as newly added
62
# relative to the basis revision.
63
1194 by Martin Pool
- [BROKEN] more progress of commit into weaves
64
1189 by Martin Pool
- BROKEN: partial support for commit into weave
65
import os
1390 by Robert Collins
pair programming worx... merge integration and weave
66
import re
1189 by Martin Pool
- BROKEN: partial support for commit into weave
67
import sys
1188 by Martin Pool
- clean up imports in commit code
68
import time
1248 by Martin Pool
- new weave based cleanup [broken]
69
import pdb
1194 by Martin Pool
- [BROKEN] more progress of commit into weaves
70
1188 by Martin Pool
- clean up imports in commit code
71
from binascii import hexlify
1194 by Martin Pool
- [BROKEN] more progress of commit into weaves
72
from cStringIO import StringIO
1188 by Martin Pool
- clean up imports in commit code
73
74
from bzrlib.osutils import (local_time_offset, username,
75
                            rand_bytes, compact_date, user_email,
76
                            kind_marker, is_inside_any, quotefn,
1248 by Martin Pool
- new weave based cleanup [broken]
77
                            sha_string, sha_strings, sha_file, isdir, isfile,
78
                            split_lines)
1352 by Martin Pool
- store control weaves in .bzr/, not mixed in with file weaves
79
from bzrlib.branch import gen_file_id
1264 by Martin Pool
- Raise a better error from commit when a parent is absent
80
from bzrlib.errors import (BzrError, PointlessCommit,
81
                           HistoryMissing,
82
                           )
1311 by Martin Pool
- remove RevisionReference; just hold parent ids directly
83
from bzrlib.revision import Revision
1264 by Martin Pool
- Raise a better error from commit when a parent is absent
84
from bzrlib.trace import mutter, note, warning
1189 by Martin Pool
- BROKEN: partial support for commit into weave
85
from bzrlib.xml5 import serializer_v5
1188 by Martin Pool
- clean up imports in commit code
86
from bzrlib.inventory import Inventory
1189 by Martin Pool
- BROKEN: partial support for commit into weave
87
from bzrlib.weave import Weave
88
from bzrlib.weavefile import read_weave, write_weave_v5
89
from bzrlib.atomicfile import AtomicFile
90
91
1205 by Martin Pool
- add bzrlib.commit.commit compatability interface
92
def commit(*args, **kwargs):
    """Commit a new revision to a branch (function-style interface).

    Kept for the convenience of old callers.  All positional and keyword
    arguments are forwarded unchanged to Commit.commit() on a freshly
    constructed Commit object; nothing is returned.

    New code should use the Commit class instead.
    """
    ## XXX: Remove this in favor of Branch.commit?
    task = Commit()
    task.commit(*args, **kwargs)
101
102
1189 by Martin Pool
- BROKEN: partial support for commit into weave
103
class NullCommitReporter(object):
    """Commit progress reporter that discards every event.

    Each hook accepts the same arguments as the corresponding hook on
    ReportCommitToLog and does nothing.
    """

    def added(self, path):
        """Hook for an added path; this implementation ignores it."""
        return None

    def removed(self, path):
        """Hook for a removed path; this implementation ignores it."""
        return None

    def renamed(self, old_path, new_path):
        """Hook for a rename; this implementation ignores it."""
        return None
113
114
115
class ReportCommitToLog(NullCommitReporter):
    """Commit progress reporter that passes every event to note()."""

    def added(self, path):
        """Log that path was added."""
        note('added %s', path)

    def removed(self, path):
        """Log that path was removed."""
        note('removed %s', path)

    def renamed(self, old_path, new_path):
        """Log that old_path was renamed to new_path."""
        note('renamed %s => %s', old_path, new_path)
124
125
126
class Commit(object):
127
    """Task of committing a new revision.
128
129
    This is a MethodObject: it accumulates state as the commit is
130
    prepared, and then it is discarded.  It doesn't represent
131
    historical revisions, just the act of recording a new one.
132
133
            missing_ids
134
            Modified to hold a list of files that have been deleted from
135
            the working directory; these should be removed from the
136
            working inventory.
485 by Martin Pool
- move commit code into its own module
137
    """
1189 by Martin Pool
- BROKEN: partial support for commit into weave
138
    def __init__(self,
139
                 reporter=None):
140
        if reporter is not None:
141
            self.reporter = reporter
142
        else:
143
            self.reporter = NullCommitReporter()
144
145
        
146
    def commit(self,
               branch, message,
               timestamp=None,
               timezone=None,
               committer=None,
               specific_files=None,
               rev_id=None,
               allow_pointless=True,
               verbose=False):
        """Commit working copy as a new revision.

        branch -- the branch to commit into.  It is write-locked while
            the commit is recorded and unlocked again afterwards, even
            if the commit fails.

        message -- the commit message, a str or unicode string.
            Characters that cannot appear in XML are escaped before the
            message is stored.

        timestamp -- if not None, seconds-since-epoch for a
             postdated/predated commit.  Defaults to the current time.

        timezone -- if not None, the timezone offset to record;
            otherwise local_time_offset() is used.

        committer -- if not None, the committer string to record;
            otherwise username(branch) is used.

        specific_files -- If true, commit only those files.

        rev_id -- If set, use this as the new revision id.
            Useful for test or import commands that need to tightly
            control what revisions are assigned.  If you duplicate
            a revision id that exists elsewhere it is your own fault.
            If null (default), a time/random revision id is generated.

        allow_pointless -- If true (default), commit even if nothing
            has changed and no merges are recorded.

        verbose -- accepted for compatibility and ignored.

        Raises NotImplementedError for a selected-file commit when
        there is more than one parent, and PointlessCommit when
        allow_pointless is false, there is at most one parent and the
        new inventory does not differ from the basis inventory.
        """
        mutter('preparing to commit')

        self.branch = branch
        self.weave_store = branch.weave_store
        self.rev_id = rev_id
        self.specific_files = specific_files
        self.allow_pointless = allow_pointless

        if timestamp is not None:
            self.timestamp = long(timestamp)
        else:
            self.timestamp = time.time()

        # The generated id embeds the timestamp, so it has to be
        # settled before this point.
        if self.rev_id is None:
            self.rev_id = _gen_revision_id(self.branch, self.timestamp)

        if committer is not None:
            assert isinstance(committer, basestring), type(committer)
            self.committer = committer
        else:
            self.committer = username(self.branch)

        if timezone is not None:
            self.timezone = int(timezone)
        else:
            self.timezone = local_time_offset()

        assert isinstance(message, basestring), type(message)
        self.message = message
        self._escape_commit_message()

        self.branch.lock_write()
        try:
            self.work_tree = self.branch.working_tree()
            self.work_inv = self.work_tree.inventory
            self.basis_tree = self.branch.basis_tree()
            self.basis_inv = self.basis_tree.inventory

            self._gather_parents()
            if len(self.parents) > 1 and self.specific_files:
                raise NotImplementedError('selected-file commit of merges is not supported yet')
            self._check_parents_present()

            self._remove_deleted()
            self._populate_new_inv()
            self._store_snapshot()
            self._report_deletes()

            # Pointless: not explicitly allowed, not a merge, and the
            # inventory is the same as in the basis revision.
            if (not self.allow_pointless
                and len(self.parents) <= 1
                and not (self.new_inv != self.basis_inv)):
                raise PointlessCommit()

            self._record_inventory()
            self._record_ancestry()
            self._make_revision()
            new_revno = self.branch.revno() + 1
            note('committed r%d {%s}', new_revno, self.rev_id)
            self.branch.append_revision(self.rev_id)
            self.branch.set_pending_merges([])
        finally:
            self.branch.unlock()
235
236
1245 by Martin Pool
doc
237
1189 by Martin Pool
- BROKEN: partial support for commit into weave
238
    def _record_inventory(self):
        """Store the inventory for the new revision.

        The new inventory is serialised to a string, its SHA-1 is kept
        in self.inv_sha1, and its lines are added to the 'inventory'
        control weave under the new revision id with self.parents as
        parents.
        """
        inventory_text = serializer_v5.write_inventory_to_string(self.new_inv)
        self.inv_sha1 = sha_string(inventory_text)
        control_weaves = self.branch.control_weaves
        inventory_lines = split_lines(inventory_text)
        control_weaves.add_text('inventory', self.rev_id,
                                inventory_lines, self.parents)
1223 by Martin Pool
- store inventories in weave
245
1390 by Robert Collins
pair programming worx... merge integration and weave
246
    def _escape_commit_message(self):
247
        """Replace xml-incompatible control characters."""
1185.1.23 by Robert Collins
Harald Meland's xml escaping on commit patch
248
        # Python strings can include characters that can't be
249
        # represented in well-formed XML; escape characters that
250
        # aren't listed in the XML specification
251
        # (http://www.w3.org/TR/REC-xml/#NT-Char).
1390 by Robert Collins
pair programming worx... merge integration and weave
252
        if isinstance(self.message, unicode):
1185.1.23 by Robert Collins
Harald Meland's xml escaping on commit patch
253
            char_pattern = u'[^\x09\x0A\x0D\u0020-\uD7FF\uE000-\uFFFD]'
254
        else:
255
            # Use a regular 'str' as pattern to avoid having re.subn
256
            # return 'unicode' results.
257
            char_pattern = '[^x09\x0A\x0D\x20-\xFF]'
1390 by Robert Collins
pair programming worx... merge integration and weave
258
        self.message, escape_count = re.subn(
1185.1.23 by Robert Collins
Harald Meland's xml escaping on commit patch
259
            char_pattern,
260
            lambda match: match.group(0).encode('unicode_escape'),
1390 by Robert Collins
pair programming worx... merge integration and weave
261
            self.message)
1185.1.23 by Robert Collins
Harald Meland's xml escaping on commit patch
262
        if escape_count:
263
            note("replaced %d control characters in message", escape_count)
1223 by Martin Pool
- store inventories in weave
264
1225 by Martin Pool
- branch now tracks ancestry - all merged revisions
265
    def _record_ancestry(self):
1270 by Martin Pool
- fix recording of merged ancestry lines
266
        """Append merged revision ancestry to the ancestry file.
267
268
        This should be the merged ancestry of all parents, plus the
269
        new revision id."""
1390 by Robert Collins
pair programming worx... merge integration and weave
270
        s = self.branch.control_weaves
1352 by Martin Pool
- store control weaves in .bzr/, not mixed in with file weaves
271
        w = s.get_weave_or_empty('ancestry')
1333 by Martin Pool
- split out merge-ancestry stuff where it can be reused
272
        lines = self._make_ancestry(w)
1269 by Martin Pool
- some weave operations automatically look up symbolic names if supplied
273
        w.add(self.rev_id, self.parents, lines)
1352 by Martin Pool
- store control weaves in .bzr/, not mixed in with file weaves
274
        s.put_weave('ancestry', w)
1225 by Martin Pool
- branch now tracks ancestry - all merged revisions
275
276
1333 by Martin Pool
- split out merge-ancestry stuff where it can be reused
277
    def _make_ancestry(self, ancestry_weave):
        """Return merged ancestry lines.

        The ancestry of every parent is read from ancestry_weave and
        merged, together with the new revision id, by
        merge_ancestry_lines().  The lines are revision-ids followed by
        newlines.
        """
        parent_ancestries = []
        for parent_id in self.parents:
            parent_ancestries.append(ancestry_weave.get(parent_id))
        merged = merge_ancestry_lines(self.rev_id, parent_ancestries)
        mutter('merged ancestry of {%s}:\n%s', self.rev_id, ''.join(merged))
        return merged
1270 by Martin Pool
- fix recording of merged ancestry lines
285
286
1223 by Martin Pool
- store inventories in weave
287
    def _gather_parents(self):
288
        pending_merges = self.branch.pending_merges()
289
        self.parents = []
1284 by Martin Pool
- in commit, avoid reading basis inventory twice
290
        self.parent_trees = []
1241 by Martin Pool
- rename last_patch to last_revision
291
        precursor_id = self.branch.last_revision()
1223 by Martin Pool
- store inventories in weave
292
        if precursor_id:
293
            self.parents.append(precursor_id)
1284 by Martin Pool
- in commit, avoid reading basis inventory twice
294
            self.parent_trees.append(self.basis_tree)
1223 by Martin Pool
- store inventories in weave
295
        self.parents += pending_merges
1284 by Martin Pool
- in commit, avoid reading basis inventory twice
296
        self.parent_trees.extend(map(self.branch.revision_tree, pending_merges))
297
298
299
    def _check_parents_present(self):
        """Check that the branch holds every parent revision.

        Raises HistoryMissing, after logging a warning, for the first
        parent id the branch does not have.
        """
        for parent_id in self.parents:
            mutter('commit parent revision {%s}', parent_id)
            if self.branch.has_revision(parent_id):
                continue
            warning("can't commit a merge from an absent parent")
            raise HistoryMissing(self.branch, 'revision', parent_id)
1284 by Martin Pool
- in commit, avoid reading basis inventory twice
305
306
            
1189 by Martin Pool
- BROKEN: partial support for commit into weave
307
    def _make_revision(self):
        """Record a new revision object for this commit.

        The Revision is built from the values gathered during the
        commit, kept in self.rev, serialised, and added (compressed) to
        the branch's revision store under the new revision id.
        """
        revision = Revision(timestamp=self.timestamp,
                            timezone=self.timezone,
                            committer=self.committer,
                            message=self.message,
                            inventory_sha1=self.inv_sha1,
                            revision_id=self.rev_id)
        self.rev = revision
        revision.parent_ids = self.parents
        serialised = StringIO()
        serializer_v5.write_revision(revision, serialised)
        # Rewind so the store reads the text from the beginning.
        serialised.seek(0)
        self.branch.revision_store.add(serialised, self.rev_id,
                                       compressed=True)
        mutter('new revision_id is {%s}', self.rev_id)
321
322
323
    def _remove_deleted(self):
        """Remove deleted files from the working inventory.

        This is done prior to taking the working inventory as the
        basis for the new committed inventory.

        Every working-inventory entry that is within the selected files
        (or any entry, when no files were selected) and whose path no
        longer exists in the working tree is logged as missing and
        deleted from the working inventory.  If anything was deleted,
        the working inventory is written back through the branch.

        Nothing is returned.
        """
        selected = self.specific_files
        missing_ids = []
        for path, entry in self.work_inv.iter_entries():
            if selected and not is_inside_any(selected, path):
                continue
            if self.work_tree.has_filename(path):
                continue
            note('missing %s', path)
            missing_ids.append(entry.file_id)
        if not missing_ids:
            return
        for file_id in missing_ids:
            del self.work_inv[file_id]
        self.branch._write_inventory(self.work_inv)
1248 by Martin Pool
- new weave based cleanup [broken]
346
347
1092.2.22 by Robert Collins
text_version and name_version unification looking reasonable
348
    def _find_entry_parents(self, file_id):
1248 by Martin Pool
- new weave based cleanup [broken]
349
        """Return the text versions and hashes for all file parents.
350
1285 by Martin Pool
- fix bug in committing files that are renamed but not modified
351
        Returned as a map from text version to inventory entry.
1248 by Martin Pool
- new weave based cleanup [broken]
352
353
        This is a set containing the file versions in all parents
354
        revisions containing the file.  If the file is new, the set
355
        will be empty."""
356
        r = {}
357
        for tree in self.parent_trees:
358
            if file_id in tree.inventory:
359
                ie = tree.inventory[file_id]
360
                assert ie.file_id == file_id
1092.2.22 by Robert Collins
text_version and name_version unification looking reasonable
361
                if ie.revision in r:
362
                    assert r[ie.revision] == ie
1248 by Martin Pool
- new weave based cleanup [broken]
363
                else:
1092.2.22 by Robert Collins
text_version and name_version unification looking reasonable
364
                    r[ie.revision] = ie
1303 by Martin Pool
- commit updates entry_version
365
        return r
366
1092.2.22 by Robert Collins
text_version and name_version unification looking reasonable
367
    def _snapshot_entry(self, path, ie, previous_entries):
        """Store a single possibly changed inventory entry in the branch.

        path -- path of the entry.
        ie -- the entry from the new inventory; entries whose revision
            is already set were not selected for commit and are left
            alone.
        previous_entries -- map from revision to the entry for this
            file in the parent trees.

        An entry with exactly one parent version that it is unchanged
        from takes over that parent's revision.  Any other entry is
        given the new revision id, and if it is a file its text is
        committed as well.  The outcome is reported either way.
        """
        mutter('parents of %s are %r', path, previous_entries)
        if ie.revision is not None:
            # not selected for commit
            return
        if ie.kind == 'symlink':
            ie.read_symlink_target(self.branch.abspath(path))
        if len(previous_entries) == 1:
            # cannot be unchanged unless there is only one parent file rev.
            sole_parent = previous_entries.values()[0]
            if ie.unchanged(sole_parent, self.work_tree):
                mutter("found unchanged entry")
                ie.revision = sole_parent.revision
                self.report_entry_status(previous_entries, path, ie)
                return
        mutter('new revision for {%s}', ie.file_id)
        ie.revision = self.rev_id
        self.report_entry_status(previous_entries, path, ie)
        if ie.kind == 'file':
            # file is either new, or a file merge; need to record
            # a new version
            self._commit_file(ie, previous_entries)
394
395
    def report_entry_status(self, previous_entries, path, ie):
        """Log how the entry at path relates to its parent versions.

        previous_entries -- map of the entry's versions in the parent
            trees; only its size is examined.
        path -- path of the entry, used in the message.
        ie -- the entry being committed.

        More than one parent version is logged as 'merged' and none as
        'added'.  With exactly one, the entry is logged as
        'modified/renamed/reparented' if it carries the new revision id
        and as 'unchanged' otherwise.
        """
        parent_count = len(previous_entries)
        if parent_count > 1:
            note('merged %s', path)
        elif parent_count == 0:
            note('added %s', path)
        elif ie.revision == self.rev_id:
            # Space before %s so the path is not glued to the status word.
            note('modified/renamed/reparented %s', path)
        else:
            note('unchanged %s', path)
404
405
    def _store_snapshot(self):
406
        """Pass over inventory and record a snapshot.
1303 by Martin Pool
- commit updates entry_version
407
1092.2.21 by Robert Collins
convert name_version to revision in inventory entries
408
        Entries get a new revision when they are modified in 
409
        any way, which includes a merge with a new set of
410
        parents that have the same entry. Currently we do not
411
        check for that set being ancestors of each other - and
412
        we should - only parallel children should count for this
1092.2.22 by Robert Collins
text_version and name_version unification looking reasonable
413
        test see find_entry_parents to correct this. FIXME <---
414
        I.e. if we are merging in revision FOO, and our
1092.2.21 by Robert Collins
convert name_version to revision in inventory entries
415
        copy of file id BAR is identical to FOO.BAR, we should
416
        generate a new revision of BAR IF and only IF FOO is
417
        neither a child of our current tip, nor an ancestor of
418
        our tip. The presence of FOO in our store should not 
419
        affect this logic UNLESS we are doing a merge of FOO,
420
        or a child of FOO.
421
        """
1303 by Martin Pool
- commit updates entry_version
422
        # XXX: Need to think more here about when the user has
423
        # made a specific decision on a particular value -- c.f.
424
        # mark-merge.  
425
        for path, ie in self.new_inv.iter_entries():
1092.2.22 by Robert Collins
text_version and name_version unification looking reasonable
426
            previous_entries = self._find_entry_parents(ie. file_id)
427
            self._snapshot_entry(path, ie, previous_entries)
428
429
    def _populate_new_inv(self):
        """Build revision inventory.

        This creates a new empty inventory and fills it from the
        working inventory.  Entries selected for commit (all of them
        when no specific files were given) are copied with their
        revision set to None, marking them as candidates for
        modification.  Entries that are not selected are carried over
        from the basis inventory with their prior revision.
        """
        mutter("Selecting files for commit with filter %s", self.specific_files)
        self.new_inv = Inventory()
        for path, work_entry in self.work_inv.iter_entries():
            file_id = work_entry.file_id
            mutter('check %s {%s}', path, work_entry.file_id)
            if (self.specific_files
                and not is_inside_any(self.specific_files, path)):
                mutter('%s not selected for commit', path)
                self._carry_file(file_id)
                continue
            mutter('%s selected for commit', path)
            candidate = work_entry.copy()
            candidate.revision = None
            self.new_inv.add(candidate)
1249 by Martin Pool
- improvements to weave commit [broken]
453
454
    def _carry_file(self, file_id):
1285 by Martin Pool
- fix bug in committing files that are renamed but not modified
455
        """Carry the file unchanged from the basis revision."""
1249 by Martin Pool
- improvements to weave commit [broken]
456
        if self.basis_inv.has_id(file_id):
457
            self.new_inv.add(self.basis_inv[file_id].copy())
1248 by Martin Pool
- new weave based cleanup [broken]
458
459
    def _report_deletes(self):
        """Log each basis-inventory file that is absent from the new inventory."""
        for file_id in self.basis_inv:
            if file_id in self.new_inv:
                continue
            note('deleted %s', self.basis_inv.id2path(file_id))
463
1092.2.22 by Robert Collins
text_version and name_version unification looking reasonable
464
    def _commit_file(self, new_ie, file_parents):
        """Store the text for new_ie in the weave store.

        new_ie -- the file entry being committed; its revision is
            already set.
        file_parents -- map from revision to the entry for this file in
            the parent trees.

        When there is exactly one parent version and its text SHA-1 and
        size match those of new_ie, the text is recorded as identical
        to that version.  Otherwise the file is read from the working
        tree and added as a new text, and new_ie's text_sha1 and
        text_size are updated from the lines read.
        """
        mutter('storing file {%s} in revision {%s}',
               new_ie.file_id, new_ie.revision)
        if len(file_parents) == 1:
            previous_ie = file_parents.values()[0]
            # special case to avoid diffing on renames or
            # reparenting
            if (new_ie.text_sha1 == previous_ie.text_sha1
                and new_ie.text_size == previous_ie.text_size):
                self.weave_store.add_identical_text(
                    new_ie.file_id, previous_ie.revision,
                    new_ie.revision, file_parents)
                return
        new_lines = self.work_tree.get_file(new_ie.file_id).readlines()
        self._add_text_to_weave(new_ie.file_id, new_lines, file_parents)
        new_ie.text_sha1 = sha_strings(new_lines)
        new_ie.text_size = sum([len(line) for line in new_lines])
1194 by Martin Pool
- [BROKEN] more progress of commit into weaves
481
1199 by Martin Pool
- weave commit records per-file ancestors
482
    def _add_text_to_weave(self, file_id, new_lines, parents):
1248 by Martin Pool
- new weave based cleanup [broken]
483
        self.weave_store.add_text(file_id, self.rev_id, new_lines, parents)
1189 by Martin Pool
- BROKEN: partial support for commit into weave
484
485
def _gen_revision_id(branch, when):
    """Return new revision-id.

    The id is user_email(branch) and compact_date(when), each followed
    by a dash, then the hex encoding of 8 random bytes.
    """
    prefix = '%s-%s-' % (user_email(branch), compact_date(when))
    return prefix + hexlify(rand_bytes(8))
633 by Martin Pool
- Show added/renamed/modified messages from commit for non-file
490
1248 by Martin Pool
- new weave based cleanup [broken]
491
492
493
    
1333 by Martin Pool
- split out merge-ancestry stuff where it can be reused
494
def merge_ancestry_lines(rev_id, ancestries):
    """Return merged ancestry lines.

    rev_id -- id of the new revision

    ancestries -- a sequence of ancestries for parent revisions,
        as newline-terminated line lists.

    The result starts with a copy of the first ancestry, followed by
    the lines of each later ancestry that have not been seen yet, in
    the order they are met, and ends with the line for rev_id.  The
    new revision must not already be in the merged ancestry.
    """
    if not ancestries:
        return [rev_id + '\n']
    first = ancestries[0]
    seen = set(first)
    merged = first[:]
    for other_ancestry in ancestries[1:]:
        for line in other_ancestry:
            assert line[-1] == '\n'
            if line in seen:
                continue
            merged.append(line)
            seen.add(line)
    own_line = rev_id + '\n'
    assert own_line not in seen
    merged.append(own_line)
    return merged