/brz/remove-bazaar : revision 7290.1.45

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to breezy/_patiencediff_py.py

Committer: Jelmer Vernooĳ
Date: 2019-12-23 01:39:21 UTC
mfrom: (7424 work)
mto: This revision was merged to the branch mainline in revision 7425.
Revision ID: jelmer@jelmer.uk-20191223013921-2kzd0wlcoylgxksk

Merge trunk.

files added:
.gitignore

breezy/bedding.py

breezy/bzr/bundle

breezy/mergeable.py

breezy/multiwalker.py

breezy/plugins/flake8

breezy/plugins/flake8/__init__.py

breezy/plugins/fossil

breezy/plugins/fossil/__init__.py

breezy/plugins/quilt

breezy/plugins/quilt/__init__.py

breezy/plugins/quilt/merge.py

breezy/plugins/quilt/quilt.py

breezy/plugins/quilt/tests

breezy/plugins/quilt/tests/__init__.py

breezy/plugins/quilt/tests/test_merge.py

breezy/plugins/quilt/tests/test_wrapper.py

breezy/plugins/quilt/wrapper.py

breezy/plugins/stats/test_blackbox.py

breezy/plugins/zsh_completion

breezy/plugins/zsh_completion/__init__.py

breezy/plugins/zsh_completion/tests

breezy/plugins/zsh_completion/tests/__init__.py

breezy/plugins/zsh_completion/tests/test_zshcomp.py

breezy/plugins/zsh_completion/zshcomp.py

breezy/tests/blackbox/test_big_file.py

breezy/tests/blackbox/test_patch.py

breezy/tests/blackbox/test_resolve_location.py

breezy/tests/test_bedding.py

breezy/tests/test_mergeable.py

breezy/tests/test_multiwalker.py

doc/en/release-notes/brz-3.1.txt

doc/en/whats-new/whats-new-in-3.1.txt

files removed:
breezy/_patiencediff_c.c

breezy/_patiencediff_py.py

breezy/bundle

breezy/patiencediff.py

breezy/transport/http/_urllib2_wrappers.py

files renamed:
breezy/bundle/__init__.py => breezy/bzr/bundle/__init__.py

breezy/bundle/apply_bundle.py => breezy/bzr/bundle/apply_bundle.py

breezy/bundle/bundle_data.py => breezy/bzr/bundle/bundle_data.py

breezy/bundle/commands.py => breezy/bzr/bundle/commands.py

breezy/bundle/serializer/ => breezy/bzr/bundle/serializer/

files modified:
.bzrignore

.travis.yml

appveyor.yml

breezy/__init__.py

breezy/_annotator_py.py

breezy/annotate.py

breezy/branch.py

breezy/builtins.py

breezy/bzr/__init__.py

breezy/bzr/_btree_serializer_pyx.pyx

breezy/bzr/_chk_map_pyx.pyx

breezy/bzr/_dirstate_helpers_pyx.pyx

breezy/bzr/_knit_load_data_py.py

breezy/bzr/branch.py

breezy/bzr/bundle/serializer/__init__.py

breezy/bzr/bundle/serializer/v08.py

breezy/bzr/bundle/serializer/v09.py

breezy/bzr/bundle/serializer/v4.py

breezy/bzr/bzrdir.py

breezy/bzr/dirstate.py

breezy/bzr/fetch.py

breezy/bzr/groupcompress.py

breezy/bzr/groupcompress_repo.py

breezy/bzr/inventory.py

breezy/bzr/inventorytree.py

breezy/bzr/knit.py

breezy/bzr/pack_repo.py

breezy/bzr/remote.py

breezy/bzr/smart/medium.py

breezy/bzr/smart/request.py

breezy/bzr/versionedfile.py

breezy/bzr/vf_repository.py

breezy/bzr/weave.py

breezy/bzr/workingtree.py

breezy/bzr/workingtree_3.py

breezy/bzr/workingtree_4.py

breezy/check.py

breezy/cleanup.py

breezy/commands.py

breezy/commit.py

breezy/commit_signature_commands.py

breezy/config.py

breezy/conflicts.py

breezy/controldir.py

breezy/crash.py

breezy/delta.py

breezy/diff.py

breezy/directory_service.py

breezy/errors.py

breezy/fetch_ghosts.py

breezy/git/__init__.py

breezy/git/branch.py

breezy/git/cache.py

breezy/git/commands.py

breezy/git/commit.py

breezy/git/dir.py

breezy/git/errors.py

breezy/git/fetch.py

breezy/git/interrepo.py

breezy/git/mapping.py

breezy/git/memorytree.py

breezy/git/object_store.py

breezy/git/remote.py

breezy/git/repository.py

breezy/git/revspec.py

breezy/git/roundtrip.py

breezy/git/send.py

breezy/git/tests/test_blackbox.py

breezy/git/tests/test_dir.py

breezy/git/tests/test_mapping.py

breezy/git/tests/test_memorytree.py

breezy/git/tests/test_remote.py

breezy/git/tests/test_repository.py

breezy/git/tests/test_roundtrip.py

breezy/git/tests/test_transportgit.py

breezy/git/tests/test_urls.py

breezy/git/tests/test_workingtree.py

breezy/git/transportgit.py

breezy/git/tree.py

breezy/git/unpeel_map.py

breezy/git/urls.py

breezy/git/workingtree.py

breezy/gpg.py

breezy/help_topics/__init__.py

breezy/help_topics/en/configuration.txt

breezy/help_topics/en/missing-extensions.txt

breezy/ignores.py

breezy/info.py

breezy/library_state.py

breezy/location.py

breezy/lock.py

breezy/lockdir.py

breezy/log.py

breezy/mail_client.py

breezy/memorytree.py

breezy/merge.py

breezy/merge3.py

breezy/merge_directive.py

breezy/missing.py

breezy/msgeditor.py

breezy/multiparent.py

breezy/mutabletree.py

breezy/option.py

breezy/osutils.py

breezy/patch.py

breezy/plugin.py

breezy/plugins/bash_completion/tests/test_bashcomp.py

breezy/plugins/changelog_merge/tests/test_changelog_merge.py

breezy/plugins/commitfromnews/committemplate.py

breezy/plugins/cvs/__init__.py

breezy/plugins/darcs/__init__.py

breezy/plugins/email/emailer.py

breezy/plugins/fastimport/bzr_commit_handler.py

breezy/plugins/fastimport/exporter.py

breezy/plugins/fastimport/helpers.py

breezy/plugins/fastimport/revision_store.py

breezy/plugins/fastimport/tests/test_generic_processor.py

breezy/plugins/fastimport/tests/test_revision_store.py

breezy/plugins/launchpad/lp_api.py

breezy/plugins/launchpad/lp_directory.py

breezy/plugins/launchpad/lp_propose.py

breezy/plugins/launchpad/lp_registration.py

breezy/plugins/launchpad/test_lp_api.py

breezy/plugins/mtn/__init__.py

breezy/plugins/propose/__init__.py

breezy/plugins/propose/cmds.py

breezy/plugins/propose/github.py

breezy/plugins/propose/gitlabs.py

breezy/plugins/propose/launchpad.py

breezy/plugins/propose/propose.py

breezy/plugins/repodebug/check_chk.py

breezy/plugins/repodebug/missing_keys_for_stacking_fixer.py

breezy/plugins/stats/__init__.py

breezy/plugins/stats/classify.py

breezy/plugins/stats/cmds.py

breezy/plugins/upload/cmds.py

breezy/plugins/upload/tests/test_upload.py

breezy/plugins/weave_fmt/bzrdir.py

breezy/plugins/weave_fmt/test_bzrdir.py

breezy/plugins/weave_fmt/test_repository.py

breezy/plugins/weave_fmt/workingtree.py

breezy/push.py

breezy/reconcile.py

breezy/reconfigure.py

breezy/rename_map.py

breezy/repository.py

breezy/revisionspec.py

breezy/rules.py

breezy/send.py

breezy/shelf.py

breezy/shelf_ui.py

breezy/status.py

breezy/tag.py

breezy/tests/__init__.py

breezy/tests/blackbox/__init__.py

breezy/tests/blackbox/test_annotate.py

breezy/tests/blackbox/test_branches.py

breezy/tests/blackbox/test_commit.py

breezy/tests/blackbox/test_diff.py

breezy/tests/blackbox/test_export.py

breezy/tests/blackbox/test_info.py

breezy/tests/blackbox/test_inventory.py

breezy/tests/blackbox/test_join.py

breezy/tests/blackbox/test_logformats.py

breezy/tests/blackbox/test_push.py

breezy/tests/blackbox/test_reconcile.py

breezy/tests/blackbox/test_reconfigure.py

breezy/tests/blackbox/test_remove.py

breezy/tests/blackbox/test_revision_history.py

breezy/tests/blackbox/test_send.py

breezy/tests/blackbox/test_shared_repository.py

breezy/tests/blackbox/test_status.py

breezy/tests/blackbox/test_switch.py

breezy/tests/blackbox/test_upgrade.py

breezy/tests/blackbox/test_version.py

breezy/tests/blackbox/test_versioning.py

breezy/tests/blackbox/test_whoami.py

breezy/tests/commands/test_init_repository.py

breezy/tests/features.py

breezy/tests/per_branch/test_branch.py

breezy/tests/per_branch/test_commit.py

breezy/tests/per_branch/test_get_revision_id_to_revno_map.py

breezy/tests/per_branch/test_push.py

breezy/tests/per_branch/test_sprout.py

breezy/tests/per_branch/test_stacking.py

breezy/tests/per_controldir/test_controldir.py

breezy/tests/per_interrepository/test_fetch.py

breezy/tests/per_interrepository/test_interrepository.py

breezy/tests/per_intertree/test_compare.py

breezy/tests/per_inventory/basics.py

breezy/tests/per_merger.py

breezy/tests/per_pack_repository.py

breezy/tests/per_repository/test_check.py

breezy/tests/per_repository/test_commit_builder.py

breezy/tests/per_repository/test_repository.py

breezy/tests/per_repository/test_signatures.py

breezy/tests/per_repository/test_write_group.py

breezy/tests/per_repository_chk/test_supported.py

breezy/tests/per_repository_reference/test_add_inventory.py

breezy/tests/per_repository_reference/test_add_revision.py

breezy/tests/per_repository_reference/test_add_signature_text.py

breezy/tests/per_repository_vf/helpers.py

breezy/tests/per_repository_vf/test_check.py

breezy/tests/per_repository_vf/test_check_reconcile.py

breezy/tests/per_repository_vf/test_fileid_involved.py

breezy/tests/per_repository_vf/test_reconcile.py

breezy/tests/per_repository_vf/test_repository.py

breezy/tests/per_tree/__init__.py

breezy/tests/per_tree/test_get_root_id.py

breezy/tests/per_tree/test_ids.py

breezy/tests/per_tree/test_path_content_summary.py

breezy/tests/per_tree/test_symlinks.py

breezy/tests/per_tree/test_test_trees.py

breezy/tests/per_tree/test_tree.py

breezy/tests/per_versionedfile.py

breezy/tests/per_workingtree/test_add.py

breezy/tests/per_workingtree/test_add_reference.py

breezy/tests/per_workingtree/test_changes_from.py

breezy/tests/per_workingtree/test_commit.py

breezy/tests/per_workingtree/test_executable.py

breezy/tests/per_workingtree/test_flush.py

breezy/tests/per_workingtree/test_inv.py

breezy/tests/per_workingtree/test_is_ignored.py

breezy/tests/per_workingtree/test_locking.py

breezy/tests/per_workingtree/test_merge_from_branch.py

breezy/tests/per_workingtree/test_nested_specifics.py

breezy/tests/per_workingtree/test_pull.py

breezy/tests/per_workingtree/test_rename_one.py

breezy/tests/per_workingtree/test_set_root_id.py

breezy/tests/per_workingtree/test_walkdirs.py

breezy/tests/per_workingtree/test_workingtree.py

breezy/tests/test__dirstate_helpers.py

breezy/tests/test_branch.py

breezy/tests/test_branchbuilder.py

breezy/tests/test_bundle.py

breezy/tests/test_bzrdir.py

breezy/tests/test_cleanup.py

breezy/tests/test_commit.py

breezy/tests/test_commit_merge.py

breezy/tests/test_config.py

breezy/tests/test_controldir.py

breezy/tests/test_crash.py

breezy/tests/test_delta.py

breezy/tests/test_diff.py

breezy/tests/test_dirstate.py

breezy/tests/test_errors.py

breezy/tests/test_extract.py

breezy/tests/test_fetch.py

breezy/tests/test_http.py

breezy/tests/test_http_response.py

breezy/tests/test_https_urllib.py

breezy/tests/test_ignores.py

breezy/tests/test_import_tariff.py

breezy/tests/test_inv.py

breezy/tests/test_knit.py

breezy/tests/test_location.py

breezy/tests/test_lockdir.py

breezy/tests/test_log.py

breezy/tests/test_matchers.py

breezy/tests/test_memorytree.py

breezy/tests/test_merge.py

breezy/tests/test_merge_core.py

breezy/tests/test_missing.py

breezy/tests/test_multiparent.py

breezy/tests/test_options.py

breezy/tests/test_osutils.py

breezy/tests/test_patch.py

breezy/tests/test_read_bundle.py

breezy/tests/test_remote.py

breezy/tests/test_revert.py

breezy/tests/test_revisiontree.py

breezy/tests/test_rules.py

breezy/tests/test_shelf.py

breezy/tests/test_shelf_ui.py

breezy/tests/test_smart_add.py

breezy/tests/test_smart_transport.py

breezy/tests/test_ssh_transport.py

breezy/tests/test_subsume.py

breezy/tests/test_switch.py

breezy/tests/test_testament.py

breezy/tests/test_trace.py

breezy/tests/test_transform.py

breezy/tests/test_transport.py

breezy/tests/test_tree.py

breezy/tests/test_win32utils.py

breezy/tests/test_workingtree.py

breezy/tests/test_workingtree_4.py

breezy/textmerge.py

breezy/trace.py

breezy/transform.py

breezy/transport/__init__.py

breezy/transport/http/__init__.py

breezy/transport/http/response.py

breezy/transport/local.py

breezy/transport/log.py

breezy/transport/remote.py

breezy/transport/ssh.py

breezy/tree.py

breezy/upgrade.py

breezy/upstream_import.py

breezy/urlutils.py

breezy/version.py

breezy/version_info_formats/__init__.py

breezy/win32utils.py

breezy/workingtree.py

byov.conf

doc/developers/HACKING.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/contribution-quickstart.txt

doc/developers/development-repo.txt

doc/developers/integration.txt

doc/developers/packrepo.txt

doc/developers/profiling.txt

doc/en/admin-guide/advanced.txt

doc/en/admin-guide/simple-setups.txt

doc/en/index.txt

doc/en/mini-tutorial/index.txt

doc/en/release-notes/brz-3.0.txt

doc/en/tutorials/centralized_workflow.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/whats-new/template.txt

setup.py

tools/testr-run.py

tools/time_graph.py

tools/win32/build_release.py

Show diffs side-by-side

added added

removed removed

breezy/_patiencediff_py.py

#!/usr/bin/env python

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

from __future__ import absolute_import

from bisect import bisect

import difflib

from .trace import mutter

def unique_lcs_py(a, b):
    """Find the longest common subset for unique lines.

    :param a: An indexable object (such as string or list of strings)
    :param b: Another indexable object (such as string or list of strings)
    :return: A list of tuples, one for each line which is matched.
            [(line_in_a, line_in_b), ...]

    This only matches lines which are unique on both sides.
    This helps prevent common lines from over influencing match
    results.
    The longest common subset uses the Patience Sorting algorithm:
    http://en.wikipedia.org/wiki/Patience_sorting
    """
    # index[line] = position of line in a, or None once the line has been
    # seen more than once in a.
    index = {}
    for i, line in enumerate(a):
        index[line] = None if line in index else i

    # btoa[i] = position in a of the line b[i], or None unless that line
    # occurs exactly once on both sides.
    btoa = [None] * len(b)
    index2 = {}
    for pos, line in enumerate(b):
        a_pos = index.get(line)
        if a_pos is None:
            continue
        if line in index2:
            # Second occurrence in b: unset the previous mapping, which we
            # now know to be invalid, and forget the line so that any
            # further occurrences are skipped by the lookup above.
            btoa[index2[line]] = None
            del index[line]
        else:
            index2[line] = pos
            btoa[pos] = a_pos

    # This is the Patience sorting algorithm,
    # see http://en.wikipedia.org/wiki/Patience_sorting
    # stacks[k] is the a-position currently on top of pile k, lasts[k] is
    # the b-position that put it there, and backpointers[bpos] links a
    # b-position to the top of the previous pile at the time it was placed.
    backpointers = [None] * len(b)
    stacks = []
    lasts = []
    k = 0
    for bpos, apos in enumerate(btoa):
        if apos is None:
            continue
        # as an optimization, check if the next line comes at the end,
        # because it usually does
        if stacks and stacks[-1] < apos:
            k = len(stacks)
        # as an optimization, check if the next line comes right after
        # the previous line, because usually it does
        elif stacks and stacks[k] < apos and (k == len(stacks) - 1 or
                                              stacks[k + 1] > apos):
            k += 1
        else:
            k = bisect(stacks, apos)
        if k > 0:
            backpointers[bpos] = lasts[k - 1]
        if k < len(stacks):
            stacks[k] = apos
            lasts[k] = bpos
        else:
            stacks.append(apos)
            lasts.append(bpos)

    if not lasts:
        return []

    # Walk the backpointer chain from the top of the last pile, then put
    # the collected pairs back into increasing order.
    result = []
    k = lasts[-1]
    while k is not None:
        result.append((btoa[k], k))
        k = backpointers[k]
    result.reverse()
    return result

101

102

103

def recurse_matches_py(a, b, alo, blo, ahi, bhi, answer, maxrecursion):
    """Find all of the matching text in the lines of a and b.

    :param a: A sequence
    :param b: Another sequence
    :param alo: The start location of a to check, typically 0
    :param blo: The start location of b to check, typically 0
    :param ahi: The maximum length of a to check, typically len(a)
    :param bhi: The maximum length of b to check, typically len(b)
    :param answer: The return array. Will be filled with tuples
                   indicating [(line_in_a, line_in_b)]
    :param maxrecursion: The maximum depth to recurse.
                         Must be a positive integer.
    :return: None, the return value is in the parameter answer, which
             should be a list
    """
    if maxrecursion < 0:
        mutter('max recursion depth reached')
        # this will never happen normally, this check is to prevent DOS attacks
        return
    oldlength = len(answer)
    if alo == ahi or blo == bhi:
        # One of the two ranges is empty, so nothing can match.
        return
    last_a_pos = alo - 1
    last_b_pos = blo - 1
    for apos, bpos in unique_lcs_py(a[alo:ahi], b[blo:bhi]):
        # recurse between lines which are unique in each file and match
        # (unique_lcs_py works on the slices, so shift back to absolute
        # positions first)
        apos += alo
        bpos += blo
        # Most of the time, you will have a sequence of similar entries
        if last_a_pos + 1 != apos or last_b_pos + 1 != bpos:
            recurse_matches_py(
                a, b, last_a_pos + 1, last_b_pos + 1, apos, bpos, answer,
                maxrecursion - 1)
        last_a_pos = apos
        last_b_pos = bpos
        answer.append((apos, bpos))
    if len(answer) > oldlength:
        # find matches between the last match and the end
        recurse_matches_py(a, b, last_a_pos + 1, last_b_pos + 1,
                           ahi, bhi, answer, maxrecursion - 1)
    elif a[alo] == b[blo]:
        # find matching lines at the very beginning
        while alo < ahi and blo < bhi and a[alo] == b[blo]:
            answer.append((alo, blo))
            alo += 1
            blo += 1
        recurse_matches_py(a, b, alo, blo,
                           ahi, bhi, answer, maxrecursion - 1)
    elif a[ahi - 1] == b[bhi - 1]:
        # find matching lines at the very end
        nahi = ahi - 1
        nbhi = bhi - 1
        while nahi > alo and nbhi > blo and a[nahi - 1] == b[nbhi - 1]:
            nahi -= 1
            nbhi -= 1
        # Recurse on what precedes the common tail *before* appending the
        # tail itself, so that answer stays in increasing order.
        recurse_matches_py(a, b, last_a_pos + 1, last_b_pos + 1,
                           nahi, nbhi, answer, maxrecursion - 1)
        for i in range(ahi - nahi):
            answer.append((nahi + i, nbhi + i))

164

165

166

def _collapse_sequences(matches):

167

"""Find sequences of lines.

168

169

Given a sequence of [(line_in_a, line_in_b),]

170

find regions where they both increment at the same time

171

"""

172

answer = []

173

start_a = start_b = None

174

length = 0

175

for i_a, i_b in matches:

176

if (start_a is not None

177

and (i_a == start_a + length)

178

and (i_b == start_b + length)):

179

length += 1

180

else:

181

if start_a is not None:

182

answer.append((start_a, start_b, length))

183

start_a = i_a

184

start_b = i_b

185

length = 1

186

187

if length != 0:

188

answer.append((start_a, start_b, length))

189

190

return answer

191

192

193

def _check_consistency(answer):

194

# For consistency sake, make sure all matches are only increasing

195

next_a = -1

196

next_b = -1

197

for (a, b, match_len) in answer:

198

if a < next_a:

199

raise ValueError('Non increasing matches for a')

200

if b < next_b:

201

raise ValueError('Non increasing matches for b')

202

next_a = a + match_len

203

next_b = b + match_len

204

205

206

class PatienceSequenceMatcher_py(difflib.SequenceMatcher):
    """Compare a pair of sequences using longest common subset."""

    # When true (and Python is not run with -O), get_matching_blocks
    # validates its result with _check_consistency before returning it.
    _do_check_consistency = True

    def __init__(self, isjunk=None, a='', b=''):
        """Create a matcher for the sequences a and b.

        :param isjunk: Must be None; junk heuristics are not supported.
        :param a: The first sequence to compare.
        :param b: The second sequence to compare.
        :raises NotImplementedError: If isjunk is not None.
        """
        if isjunk is not None:
            raise NotImplementedError('Currently we do not support'
                                      ' isjunk for sequence matching')
        difflib.SequenceMatcher.__init__(self, isjunk, a, b)

    def get_matching_blocks(self):
        """Return list of triples describing matching subsequences.

        Each triple is of the form (i, j, n), and means that
        a[i:i+n] == b[j:j+n].  The triples are monotonically increasing in
        i and in j.

        The last triple is a dummy, (len(a), len(b), 0), and is the only
        triple with n==0.

        >>> s = PatienceSequenceMatcher_py(None, "abxcd", "abcd")
        >>> s.get_matching_blocks()
        [(0, 0, 2), (3, 2, 2), (5, 4, 0)]
        """
        # jam 20060525 This is the python 2.4.1 difflib get_matching_blocks
        # implementation which uses __helper. 2.4.3 got rid of helper for
        # doing it inline with a queue.
        # We should consider doing the same for recurse_matches

        # Reuse the cached result if there is one.
        if self.matching_blocks is not None:
            return self.matching_blocks

        matches = []
        # The trailing 10 is the recursion depth limit (maxrecursion).
        recurse_matches_py(self.a, self.b, 0, 0,
                           len(self.a), len(self.b), matches, 10)
        # Matches now has individual line pairs of
        # line A matches line B, at the given offsets
        self.matching_blocks = _collapse_sequences(matches)
        self.matching_blocks.append((len(self.a), len(self.b), 0))
        # The flag is deliberately read from this class, not from self.
        if PatienceSequenceMatcher_py._do_check_consistency:
            if __debug__:
                _check_consistency(self.matching_blocks)

        return self.matching_blocks

Older »