13
13
# You should have received a copy of the GNU General Public License
14
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17
18
# mbp: "you know that thing where cvs gives you conflict markers?"
18
19
# s: "i hate that."
29
class CantReprocessAndShowBase(errors.BzrError):
31
_fmt = ("Can't reprocess and show base, because reprocessing obscures "
32
"the relationship of conflicting lines to the base")
22
from bzrlib.errors import CantReprocessAndShowBase
23
import bzrlib.patiencediff
24
from bzrlib.textfile import check_text_lines
35
27
def intersect(ra, rb):
57
50
def compare_range(a, astart, aend, b, bstart, bend):
58
51
"""Compare a[astart:aend] == b[bstart:bend], without slicing.
60
if (aend - astart) != (bend - bstart):
53
if (aend-astart) != (bend-bstart):
62
for ia, ib in zip(range(astart, aend), range(bstart, bend)):
55
for ia, ib in zip(xrange(astart, aend), xrange(bstart, bend)):
69
64
class Merge3(object):
72
67
Given BASE, OTHER, THIS, tries to produce a combined text
73
68
incorporating the changes from both BASE->OTHER and BASE->THIS.
74
69
All three will typically be sequences of lines."""
76
def __init__(self, base, a, b, is_cherrypick=False, allow_objects=False):
79
:param base: lines in BASE
82
:param is_cherrypick: flag indicating if this merge is a cherrypick.
83
When cherrypicking b => a, matches with b and base do not conflict.
84
:param allow_objects: if True, do not require that base, a and b are
85
plain Python strs. Also prevents BinaryFile from being raised.
86
Lines can be any sequence of comparable and hashable Python
90
textfile.check_text_lines(base)
91
textfile.check_text_lines(a)
92
textfile.check_text_lines(b)
70
def __init__(self, base, a, b):
71
check_text_lines(base)
96
self.is_cherrypick = is_cherrypick
98
80
def merge_lines(self,
102
start_marker=b'<<<<<<<',
103
mid_marker=b'=======',
104
end_marker=b'>>>>>>>',
84
start_marker='<<<<<<<',
107
89
"""Return merge in cvs-like form.
110
92
if len(self.a) > 0:
111
if self.a[0].endswith(b'\r\n'):
113
elif self.a[0].endswith(b'\r'):
93
if self.a[0].endswith('\r\n'):
95
elif self.a[0].endswith('\r'):
115
97
if base_marker and reprocess:
116
98
raise CantReprocessAndShowBase()
118
start_marker = start_marker + b' ' + name_a
100
start_marker = start_marker + ' ' + name_a
120
end_marker = end_marker + b' ' + name_b
102
end_marker = end_marker + ' ' + name_b
121
103
if name_base and base_marker:
122
base_marker = base_marker + b' ' + name_base
104
base_marker = base_marker + ' ' + name_base
123
105
merge_regions = self.merge_regions()
124
106
if reprocess is True:
125
107
merge_regions = self.reprocess_merge_regions(merge_regions)
240
231
# section a[0:ia] has been disposed of, etc
243
234
for zmatch, zend, amatch, aend, bmatch, bend in self.find_sync_regions():
235
#print 'match base [%d:%d]' % (zmatch, zend)
244
237
matchlen = zend - zmatch
247
# matchlen == (aend - amatch)
248
# matchlen == (bend - bmatch)
239
assert matchlen == (aend - amatch)
240
assert matchlen == (bend - bmatch)
249
242
len_a = amatch - ia
250
243
len_b = bmatch - ib
244
len_base = zmatch - iz
255
# print 'unmatched a=%d, b=%d' % (len_a, len_b)
249
#print 'unmatched a=%d, b=%d' % (len_a, len_b)
257
251
if len_a or len_b:
258
252
# try to avoid actually slicing the lists
253
equal_a = compare_range(self.a, ia, amatch,
254
self.base, iz, zmatch)
255
equal_b = compare_range(self.b, ib, bmatch,
256
self.base, iz, zmatch)
259
257
same = compare_range(self.a, ia, amatch,
260
258
self.b, ib, bmatch)
263
261
yield 'same', ia, amatch
262
elif equal_a and not equal_b:
263
yield 'b', ib, bmatch
264
elif equal_b and not equal_a:
265
yield 'a', ia, amatch
266
elif not equal_a and not equal_b:
267
yield 'conflict', iz, zmatch, ia, amatch, ib, bmatch
265
equal_a = compare_range(self.a, ia, amatch,
266
self.base, iz, zmatch)
267
equal_b = compare_range(self.b, ib, bmatch,
268
self.base, iz, zmatch)
269
if equal_a and not equal_b:
270
yield 'b', ib, bmatch
271
elif equal_b and not equal_a:
272
yield 'a', ia, amatch
273
elif not equal_a and not equal_b:
274
if self.is_cherrypick:
275
for node in self._refine_cherrypick_conflict(
276
iz, zmatch, ia, amatch,
280
yield ('conflict', iz, zmatch, ia, amatch, ib,
283
raise AssertionError(
284
"can't handle a=b=base but unmatched")
269
raise AssertionError("can't handle a=b=base but unmatched")
290
275
# if the same part of the base was deleted on both sides
291
276
# that's OK, we can just skip it.
295
# assert ia == amatch
296
# assert ib == bmatch
297
# assert iz == zmatch
299
284
yield 'unchanged', zmatch, zend
304
def _refine_cherrypick_conflict(self, zstart, zend, astart, aend, bstart,
306
"""When cherrypicking b => a, ignore matches with b and base."""
307
# Do not emit regions which match, only regions which do not match
308
matches = patiencediff.PatienceSequenceMatcher(
309
None, self.base[zstart:zend], self.b[bstart:bend]
310
).get_matching_blocks()
315
for base_idx, b_idx, match_len in matches:
316
conflict_b_len = b_idx - last_b_idx
317
if conflict_b_len == 0:
318
# There are no lines in b which conflict, so skip it
323
zstart + last_base_idx, zstart + base_idx,
324
aend, aend, bstart + last_b_idx, bstart + b_idx)
326
# The first conflict gets the a-range
328
yield ('conflict', zstart + last_base_idx, zstart +
330
astart, aend, bstart + last_b_idx, bstart + b_idx)
331
last_base_idx = base_idx + match_len
332
last_b_idx = b_idx + match_len
333
if last_base_idx != zend - zstart or last_b_idx != bend - bstart:
335
yield ('conflict', zstart + last_base_idx, zstart + base_idx,
336
aend, aend, bstart + last_b_idx, bstart + b_idx)
338
# The first conflict gets the a-range
340
yield ('conflict', zstart + last_base_idx, zstart + base_idx,
341
astart, aend, bstart + last_b_idx, bstart + b_idx)
343
yield ('conflict', zstart, zend, astart, aend, bstart, bend)
345
290
def reprocess_merge_regions(self, merge_regions):
346
291
"""Where there are conflict regions, remove the agreed lines.
348
Lines where both A and B have made the same changes are
293
Lines where both A and B have made the same changes are
351
296
for region in merge_regions:
355
300
type, iz, zmatch, ia, amatch, ib, bmatch = region
356
301
a_region = self.a[ia:amatch]
357
302
b_region = self.b[ib:bmatch]
358
matches = patiencediff.PatienceSequenceMatcher(
359
None, a_region, b_region).get_matching_blocks()
303
matches = bzrlib.patiencediff.PatienceSequenceMatcher(
304
None, a_region, b_region).get_matching_blocks()
362
307
for region_ia, region_ib, region_len in matches[:-1]:
367
312
if reg is not None:
369
yield 'same', region_ia, region_len + region_ia
314
yield 'same', region_ia, region_len+region_ia
370
315
next_a = region_ia + region_len
371
316
next_b = region_ib + region_len
372
317
reg = self.mismatch_region(next_a, amatch, next_b, bmatch)
373
318
if reg is not None:
377
def mismatch_region(next_a, region_ia, next_b, region_ib):
323
def mismatch_region(next_a, region_ia, next_b, region_ib):
378
324
if next_a < region_ia or next_b < region_ib:
379
325
return 'conflict', None, None, next_a, region_ia, next_b, region_ib
381
328
def find_sync_regions(self):
382
329
"""Return a list of sync regions, where both descendents match the base.
389
amatches = patiencediff.PatienceSequenceMatcher(
390
None, self.base, self.a).get_matching_blocks()
391
bmatches = patiencediff.PatienceSequenceMatcher(
392
None, self.base, self.b).get_matching_blocks()
336
amatches = bzrlib.patiencediff.PatienceSequenceMatcher(
337
None, self.base, self.a).get_matching_blocks()
338
bmatches = bzrlib.patiencediff.PatienceSequenceMatcher(
339
None, self.base, self.b).get_matching_blocks()
393
340
len_a = len(amatches)
394
341
len_b = len(bmatches)
410
357
# found a match of base[i[0], i[1]]; this may be less than
411
358
# the region that matches in either one
412
# assert intlen <= alen
413
# assert intlen <= blen
414
# assert abase <= intbase
415
# assert bbase <= intbase
359
assert intlen <= alen
360
assert intlen <= blen
361
assert abase <= intbase
362
assert bbase <= intbase
417
364
asub = amatch + (intbase - abase)
418
365
bsub = bmatch + (intbase - bbase)
419
366
aend = asub + intlen
420
367
bend = bsub + intlen
422
# assert self.base[intbase:intend] == self.a[asub:aend], \
423
# (self.base[intbase:intend], self.a[asub:aend])
424
# assert self.base[intbase:intend] == self.b[bsub:bend]
369
assert self.base[intbase:intend] == self.a[asub:aend], \
370
(self.base[intbase:intend], self.a[asub:aend])
372
assert self.base[intbase:intend] == self.b[bsub:bend]
426
374
sl.append((intbase, intend,
429
378
# advance whichever one ends first in the base text
430
379
if (abase + alen) < (bbase + blen):
435
384
intbase = len(self.base)
436
385
abase = len(self.a)
437
386
bbase = len(self.b)
442
393
def find_unconflicted(self):
443
394
"""Return a list of ranges in base that are not conflicted."""
444
am = patiencediff.PatienceSequenceMatcher(
445
None, self.base, self.a).get_matching_blocks()
446
bm = patiencediff.PatienceSequenceMatcher(
447
None, self.base, self.b).get_matching_blocks()
395
am = bzrlib.patiencediff.PatienceSequenceMatcher(
396
None, self.base, self.a).get_matching_blocks()
397
bm = bzrlib.patiencediff.PatienceSequenceMatcher(
398
None, self.base, self.b).get_matching_blocks()
471
422
# as for diff3 and meld the syntax is "MINE BASE OTHER"
472
with open(argv[1], 'rt') as f:
474
with open(argv[2], 'rt') as f:
476
with open(argv[3], 'rt') as f:
423
a = file(argv[1], 'rt').readlines()
424
base = file(argv[2], 'rt').readlines()
425
b = file(argv[3], 'rt').readlines()
479
427
m3 = Merge3(base, a, b)
481
# for sr in m3.find_sync_regions():
429
#for sr in m3.find_sync_regions():
484
432
# sys.stdout.writelines(m3.merge_lines(name_a=argv[1], name_b=argv[3]))