# Copyright (C) 2004, 2005, 2006, 2007 Canonical Ltd
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
17
"""File annotate based on weave storage"""
# TODO: Choice of more or less verbose formats:
#
# interposed: show more details between blocks of modified lines

# TODO: Show which revision caused a line to merge into the parent

# TODO: perhaps abbreviate timescales depending on how recent they are
# e.g. "3:12 Tue", "13 Oct", "Oct 2005", etc.
37
from bzrlib.config import extract_email_address
40
def annotate_file(branch, rev_id, file_id, verbose=False, full=False,
                  to_file=None, show_ids=False):
    """Annotate file_id at revision rev_id in branch.

    The branch should already be read_locked() when annotate_file is called.

    :param branch: The branch to look for revision numbers and history from.
    :param rev_id: The revision id to annotate.
    :param file_id: The file_id to annotate.
    :param verbose: Show all details rather than truncating to ensure
        reasonable text width.
    :param full: Repeat the annotation on every line instead of leaving it
        blank when a line has the same origin as the line before it.
    :param to_file: The file to output the annotation to; if None stdout is
        used.
    :param show_ids: Show revision ids in the annotation output.
    """
    # NOTE(review): the stdout fallback, the last_rev_id / prevanno
    # bookkeeping and the if/else/try scaffolding below were restored from
    # context (the names were referenced but never bound) -- confirm against
    # the upstream file.
    if to_file is None:
        import sys
        to_file = sys.stdout

    # Handle the show_ids case
    if show_ids:
        annotations = _annotations(branch.repository, file_id, rev_id)
        if not annotations:
            # Nothing to print, and max() below would raise ValueError on an
            # empty sequence.
            return
        max_origin_len = max(len(origin) for origin, text in annotations)
        last_rev_id = None
        for origin, text in annotations:
            if full or last_rev_id != origin:
                this = origin
            else:
                # Same origin as the previous line: leave the column blank.
                this = ''
            # text still carries its own line ending, so none is added here.
            to_file.write('%*s | %s' % (max_origin_len, this, text))
            last_rev_id = origin
        return

    # Calculate the lengths of the various columns
    annotation = list(_annotate_file(branch, rev_id, file_id))
    if len(annotation) == 0:
        max_origin_len = max_revno_len = 0
    else:
        max_origin_len = max(len(x[1]) for x in annotation)
        max_revno_len = max(len(x[0]) for x in annotation)
    if not verbose:
        # Cap the revno column; longer revnos are truncated with '>' below.
        max_revno_len = min(max_revno_len, 12)
    max_revno_len = max(max_revno_len, 3)

    # Output the annotations
    prevanno = ''
    encoding = getattr(to_file, 'encoding', None) or \
            osutils.get_terminal_encoding()
    for (revno_str, author, date_str, line_rev_id, text) in annotation:
        if verbose:
            anno = '%-*s %-*s %8s ' % (max_revno_len, revno_str,
                                       max_origin_len, author, date_str)
        else:
            if len(revno_str) > max_revno_len:
                revno_str = revno_str[:max_revno_len-1] + '>'
            anno = "%-*s %-7s " % (max_revno_len, revno_str, author[:7])
        if anno.lstrip() == "" and full:
            # Blank annotation means "same as the previous line"; in full
            # mode repeat the previous one instead.
            anno = prevanno
        try:
            to_file.write(anno)
        except UnicodeEncodeError:
            # cmd_annotate should be passing in an 'exact' object, which means
            # we have a direct handle to sys.stdout or equivalent. It may not
            # be able to handle the exact Unicode characters, but 'annotate' is
            # a user function (non-scripting), so shouldn't die because of
            # unrepresentable annotation characters. So encode using 'replace',
            # and write them again.
            to_file.write(anno.encode(encoding, 'replace'))
        to_file.write('| %s\n' % (text,))
        prevanno = anno
113
def _annotations(repo, file_id, rev_id):
    """Return the list of (origin, text) for a revision of a file.

    :param repo: The repository; its weave_store is asked for the weave of
        file_id using repo.get_transaction().
    :param file_id: The file_id whose weave is looked up.
    :param rev_id: The revision id passed to the weave's annotate_iter().
    :return: A list built from everything annotate_iter(rev_id) yields.
    """
    w = repo.weave_store.get_weave(file_id, repo.get_transaction())
    # Materialise the iterator so callers can take len() and iterate twice.
    return list(w.annotate_iter(rev_id))
119
def _annotate_file(branch, rev_id, file_id):
    """Yield the origins for each line of a file.

    This includes detailed information, such as the author name, and
    date string for the commit, rather than just the revision id.

    Each item yielded is (revno_str, author, date_str, origin, text), with
    the line ending stripped from text.  The three descriptive fields are
    empty strings when a line has the same origin as the line before it,
    and '?' when the origin revision is not present in the repository.
    """
    # NOTE(review): the last_origin bookkeeping and the else/try scaffolding
    # were restored from context (last_origin was read but never bound, and
    # the except clause had no try) -- confirm against the upstream file.
    revision_id_to_revno = branch.get_revision_id_to_revno_map()
    annotations = _annotations(branch.repository, file_id, rev_id)
    last_origin = None
    # Only load the revisions the repository actually has.
    revision_ids = set(o for o, t in annotations)
    revision_ids = [o for o in revision_ids if
                    branch.repository.has_revision(o)]
    revisions = dict((r.revision_id, r) for r in
                     branch.repository.get_revisions(revision_ids))
    for origin, text in annotations:
        text = text.rstrip('\r\n')
        if origin == last_origin:
            (revno_str, author, date_str) = ('', '', '')
        else:
            last_origin = origin
            if origin not in revisions:
                (revno_str, author, date_str) = ('?', '?', '?')
            else:
                revno_str = '.'.join(str(i) for i in
                                     revision_id_to_revno[origin])
                rev = revisions[origin]
                tz = rev.timezone or 0
                # Shift the timestamp by the stored offset before gmtime().
                date_str = time.strftime('%Y%m%d',
                                         time.gmtime(rev.timestamp + tz))
                # a lazy way to get something like the email address
                # TODO: Get real email address
                author = rev.get_apparent_author()
                try:
                    author = extract_email_address(author)
                except errors.NoEmailInUsername:
                    pass        # use the whole name
        yield (revno_str, author, date_str, origin, text)
158
def reannotate(parents_lines, new_lines, new_revision_id,
               _left_matching_blocks=None,
               heads_provider=None):
    """Create a new annotated version from new lines and parent annotations.

    :param parents_lines: List of annotated lines for all parents
    :param new_lines: The un-annotated new lines
    :param new_revision_id: The revision-id to associate with new lines
        (will often be CURRENT_REVISION)
    :param _left_matching_blocks: a hint about which areas are common
        between the text and its left-hand-parent.  The format is
        the SequenceMatcher.get_matching_blocks format
        (start_left, start_right, length_of_match).
    :param heads_provider: An object which provides a .heads() call to resolve
        if any revision ids are children of others.
        If None, then any ancestry disputes will be resolved with
        new_revision_id
    :return: A list of (revision_id, line) pairs, one per line of new_lines.
    """
    # NOTE(review): the heads_provider argument of the two-parent call, the
    # 'lines'/'line' bindings of the N-parent branch and the final return
    # were restored from context -- confirm against the upstream file.
    if len(parents_lines) == 0:
        # No parents: every line is new in this revision.
        lines = [(new_revision_id, line) for line in new_lines]
    elif len(parents_lines) == 1:
        lines = _reannotate(parents_lines[0], new_lines, new_revision_id,
                            _left_matching_blocks)
    elif len(parents_lines) == 2:
        left = _reannotate(parents_lines[0], new_lines, new_revision_id,
                           _left_matching_blocks)
        lines = _reannotate_annotated(parents_lines[1], new_lines,
                                      new_revision_id, left,
                                      heads_provider)
    else:
        # Annotate against each parent independently, then reconcile the
        # per-parent answers line by line.  The matching-blocks hint only
        # applies to the left-hand parent.
        reannotations = [_reannotate(parents_lines[0], new_lines,
                                     new_revision_id, _left_matching_blocks)]
        reannotations.extend(_reannotate(p, new_lines, new_revision_id)
                             for p in parents_lines[1:])
        lines = []
        for annos in zip(*reannotations):
            origins = set(a for a, l in annos)
            if len(origins) == 1:
                # All the parents agree, so just return the first one
                lines.append(annos[0])
            else:
                line = annos[0][1]
                # A parent that did not contain the line reports
                # new_revision_id; ignore it if exactly one other origin
                # claims the line.
                if len(origins) == 2 and new_revision_id in origins:
                    origins.remove(new_revision_id)
                if len(origins) == 1:
                    lines.append((origins.pop(), line))
                else:
                    lines.append((new_revision_id, line))
    return lines
209
def _reannotate(parent_lines, new_lines, new_revision_id,
                matching_blocks=None):
    """Annotate new_lines against a single parent.

    :param parent_lines: A list of (revision_id, line) pairs for the parent.
    :param new_lines: The un-annotated new lines.
    :param new_revision_id: The revision id given to lines that fall outside
        every matching block.
    :param matching_blocks: (parent_start, new_start, length) triples in the
        SequenceMatcher.get_matching_blocks format, including the final
        zero-length block; lines after the last block are not emitted.
        If None, the blocks are computed with PatienceSequenceMatcher.
    :return: A list of (revision_id, line) pairs.
    """
    # NOTE(review): the new_cur / lines initialisation, the new_cur advance
    # and the return were restored from context (both names were used but
    # never bound) -- confirm against the upstream file.
    new_cur = 0
    if matching_blocks is None:
        plain_parent_lines = [l for r, l in parent_lines]
        matcher = patiencediff.PatienceSequenceMatcher(None,
            plain_parent_lines, new_lines)
        matching_blocks = matcher.get_matching_blocks()
    lines = []
    for i, j, n in matching_blocks:
        # Lines between the previous match and this one are new.
        lines.extend((new_revision_id, line) for line in new_lines[new_cur:j])
        # Matched lines keep the parent's annotation.
        lines.extend(parent_lines[i:i+n])
        new_cur = j + n
    return lines
226
def _reannotate_annotated(right_parent_lines, new_lines, new_revision_id,
227
annotated_lines, heads_provider):
228
"""Update the annotations for a node based on another parent.
230
:param right_parent_lines: A list of annotated lines for the right-hand
232
:param new_lines: The unannotated new lines.
233
:param new_revision_id: The revision_id to attribute to lines which are not
234
present in either parent.
235
:param annotated_lines: A list of annotated lines. This should be the
236
annotation of new_lines based on parents seen so far.
237
:param heads_provider: When parents disagree on the lineage of a line, we
238
need to check if one side supersedes the other.
240
def get_matching_blocks(old, new):
241
matcher = patiencediff.PatienceSequenceMatcher(None,
243
return matcher.get_matching_blocks()
245
assert len(new_lines) == len(annotated_lines)
246
# First compare the newly annotated lines with the right annotated lines.
247
# Lines which were not changed in left or right should match. This tends to
248
# be the bulk of the lines, and they will need no further processing.
249
matching_left_and_right = get_matching_blocks(right_parent_lines,
252
lines_append = lines.append
253
lines_extend = lines.extend
254
last_i = 0 # The line just after the last match from the right side
256
for i, j, n in matching_left_and_right:
257
# annotated lines from last_j to j did not match the lines from last_i
258
# to i, the raw lines should be compared to determine what annotations
260
if last_i == i or last_j == j:
261
# One of the sides is empty, so this is a pure insertion
262
lines_extend(annotated_lines[last_j:j])
264
# We need to see if any of the unannotated lines match
265
plain_right_lines = [l for r,l in right_parent_lines[last_i:i]]
267
for ii, jj, nn in get_matching_blocks(plain_right_lines,
268
new_lines[last_j:j]):
269
# All the lines that don't match are just passed along
270
lines_extend(annotated_lines[last_j+last_jj:last_j+jj])
271
for offset in xrange(nn):
272
left = annotated_lines[last_j+jj+offset]
273
right = right_parent_lines[last_i+ii+offset]
274
if left[0] == right[0]:
275
# The annotations match, just return the left one
277
elif left[0] == new_revision_id:
278
# The left parent marked this as unmatched, so let the
279
# right parent claim it
282
# Left and Right both claim this line
283
if heads_provider is None:
284
lines_append((new_revision_id, left[1]))
286
heads = heads_provider.heads((left[0], right[0]))
288
lines_append((heads.pop(), left[1]))
290
# Both claim different origins
291
lines_append((new_revision_id, left[1]))
295
# If left and right agree on a range, just push that into the output
296
assert len(lines) == j
297
lines_extend(annotated_lines[j:j+n])