/brz/remove-bazaar : revision 1594.2.24

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/knit.py

Committer: Robert Collins
Date: 2006-03-09 03:27:52 UTC
mto: (1596.2.4 integration) (1594.3.1 versioned-file-performance)
mto: This revision was merged to the branch mainline in revision 1601.
Revision ID: robertc@robertcollins.net-20060309032752-3570fbe40bb2b7a2

Make use of the transaction finalisation warning support to implement in-knit caching.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py.moved

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

generate_docs.py

notes

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/knit.py

# Written by Martin Pool.

# Modified by Johan Rydberg <jrydberg@gnu.org>

# Modified by Robert Collins <robert.collins@canonical.com>

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Knit versionedfile implementation.

A knit is a versioned file implementation that supports efficient append only

updates.

Knit file layout:

lifeless: the data file is made up of "delta records". each delta record has a delta header

that contains; (1) a version id, (2) the size of the delta (in lines), and (3) the digest of

the -expanded data- (ie, the delta applied to the parent). the delta also ends with a

end-marker; simply "end VERSION"

delta can be line or full contents.

... the 8's there are the index number of the annotation.

version robertc@robertcollins.net-20051003014215-ee2990904cc4c7ad 7 c7d23b2a5bd6ca00e8e266cec0ec228158ee9f9e

59,59,3

8 if ie.executable:

8 e.set('executable', 'yes')

130,130,2

8 if elt.get('executable') == 'yes':

8 ie.executable = True

end robertc@robertcollins.net-20051003014215-ee2990904cc4c7ad

what's in an index:

09:33 < jrydberg> lifeless: each index is made up of a tuple of; version id, options, position, size, parents

09:33 < jrydberg> lifeless: the parents are currently dictionary compressed

09:33 < jrydberg> lifeless: (meaning it currently does not support ghosts)

09:33 < lifeless> right

09:33 < jrydberg> lifeless: the position and size is the range in the data file

so the index sequence is the dictionary compressed sequence number used

in the deltas to provide line annotation

"""

# TODOS:

# 10:16 < lifeless> make partial index writes safe

# 10:16 < lifeless> implement 'knit.check()' like weave.check()

# 10:17 < lifeless> record known ghosts so we can detect when they are filled in rather than the current 'reweave

# always' approach.

# move sha1 out of the content so that join is faster at verifying parents

# record content length ?

from copy import copy

from cStringIO import StringIO

import difflib

from difflib import SequenceMatcher

from gzip import GzipFile

from itertools import izip

import os

import bzrlib

import bzrlib.errors as errors

from bzrlib.errors import FileExists, NoSuchFile, KnitError, \

InvalidRevisionId, KnitCorrupt, KnitHeaderError, \

RevisionNotPresent, RevisionAlreadyPresent

from bzrlib.trace import mutter

from bzrlib.osutils import contains_whitespace, contains_linebreaks, \

sha_strings

from bzrlib.versionedfile import VersionedFile, InterVersionedFile

from bzrlib.tsort import topo_sort

# TODO: Split out code specific to this format into an associated object.

# TODO: Can we put in some kind of value to check that the index and data

# files belong together?

# TODO: accommodate binaries, perhaps by storing a byte count

# TODO: function to check whole file

# TODO: atomically append data, then measure backwards from the cursor

# position after writing to work out where it was located. we may need to

# bypass python file buffering.

100

# Suffix appended to a knit's relpath to name its data file.
DATA_SUFFIX = '.knit'

# NOTE(review): the bare integer below looks like line-number residue from the
# diff viewer this text was captured from -- confirm and drop it.
101

# Suffix appended to a knit's relpath to name its index file.
INDEX_SUFFIX = '.kndx'

102

103

104

class KnitContent(object):
    """Lines of one knit version, each paired with the origin it came from.

    ``_lines`` holds ``(origin, text)`` pairs; line deltas can be applied to
    it in place.
    """

    def __init__(self, lines):
        # The sequence is stored as given (not copied).
        self._lines = lines

    def annotate_iter(self):
        """Iterate over an (origin, text) tuple for every stored line."""
        for entry in self._lines:
            origin, text = entry
            yield origin, text

    def annotate(self):
        """Return every (origin, text) tuple as a list."""
        return [pair for pair in self.annotate_iter()]

    def apply_delta(self, delta):
        """Apply the hunks of delta to this content, in place.

        Each hunk is ``(start, end, count, lines)``: the slice
        ``[start:end]`` (in pre-delta coordinates) is replaced by ``lines``.
        """
        # Running difference between pre-delta and current line positions.
        shift = 0
        for start, end, count, replacement in delta:
            first = shift + start
            last = shift + end
            self._lines[first:last] = replacement
            shift = shift + count - (end - start)

    def line_delta_iter(self, new_lines):
        """Yield the hunks that turn this content into new_lines.

        Only text is compared; the yielded lines carry the (origin, text)
        pairs of new_lines.
        """
        new_texts = [text for _origin, text in new_lines._lines]
        old_texts = [text for _origin, text in self._lines]
        matcher = difflib.SequenceMatcher(None, old_texts, new_texts)
        for tag, old_lo, old_hi, new_lo, new_hi in matcher.get_opcodes():
            if tag != 'equal':
                yield (old_lo, old_hi, new_hi - new_lo,
                       new_lines._lines[new_lo:new_hi])

    def line_delta(self, new_lines):
        """Return the hunks of line_delta_iter() as a list."""
        return [hunk for hunk in self.line_delta_iter(new_lines)]

    def text(self):
        """Return the stored lines without their origins."""
        plain = []
        for _origin, line in self._lines:
            plain.append(line)
        return plain

141

142

143

class _KnitFactory(object):
    """Base factory for creating content objects."""

    def make(self, lines, version):
        """Return a KnitContent that attributes every line to version."""
        annotated_lines = [(version, line) for line in lines]
        return KnitContent(annotated_lines)

149

150

151

class KnitAnnotateFactory(_KnitFactory):
    """Factory for content whose stored lines carry an origin prefix.

    A stored line has the form ``'<origin> <text>'`` where origin is an
    integer.
    """

    annotated = True

    def parse_fulltext(self, content, version):
        """Turn stored fulltext lines into a KnitContent.

        ``version`` is not used: every line names its own origin.
        """
        pairs = []
        for raw in content:
            origin, text = raw.split(' ', 1)
            pairs.append((int(origin), text))
        return KnitContent(pairs)

    def parse_line_delta_iter(self, lines):
        """Yield (start, end, count, contents) hunks parsed from lines.

        ``lines`` is consumed (emptied from the front) while parsing.
        """
        while lines:
            fields = lines.pop(0).split(',')
            start, end, count = [int(field) for field in fields]
            hunk = []
            remaining = count
            while remaining > 0:
                origin, text = lines.pop(0).split(' ', 1)
                hunk.append((int(origin), text))
                remaining -= 1
            yield start, end, count, hunk

    def parse_line_delta(self, lines, version):
        """Return the hunks of parse_line_delta_iter(); version is unused."""
        return [hunk for hunk in self.parse_line_delta_iter(lines)]

    def lower_fulltext(self, content):
        """Serialise content to '<origin> <text>' lines."""
        stored = []
        for origin, text in content._lines:
            stored.append('%d %s' % (origin, text))
        return stored

    def lower_line_delta(self, delta):
        """Serialise hunks to a header line followed by annotated lines."""
        stored = []
        for start, end, count, hunk in delta:
            stored.append('%d,%d,%d\n' % (start, end, count))
            stored.extend(['%d %s' % (origin, text) for origin, text in hunk])
        return stored

186

187

188

class KnitPlainFactory(_KnitFactory):
    """Factory for content whose stored lines carry no origin prefix."""

    annotated = False

    def parse_fulltext(self, content, version):
        """Attribute every stored line to version."""
        return self.make(content, version)

    def parse_line_delta_iter(self, lines, version):
        """Yield (start, end, count, contents) hunks parsed from lines.

        Every line of a hunk is attributed to version. ``lines`` is consumed
        (emptied from the front) while parsing.
        """
        while lines:
            fields = lines.pop(0).split(',')
            start, end, count = [int(field) for field in fields]
            hunk = [(version, text) for text in lines[:count]]
            yield start, end, count, hunk
            del lines[:count]

    def parse_line_delta(self, lines, version):
        """Return the hunks of parse_line_delta_iter() as a list."""
        return [hunk for hunk in self.parse_line_delta_iter(lines, version)]

    def lower_fulltext(self, content):
        """Serialise content to its plain text lines."""
        return content.text()

    def lower_line_delta(self, delta):
        """Serialise hunks to a header line followed by plain text lines."""
        stored = []
        for start, end, count, hunk in delta:
            stored.append('%d,%d,%d\n' % (start, end, count))
            for _origin, text in hunk:
                stored.append(text)
        return stored

215

216

217

def make_empty_knit(transport, relpath):
    """Construct an empty knit at the specified location.

    :param transport: transport through which the knit files are accessed.
    :param relpath: path of the knit; the data and index suffixes are
        appended to it by KnitVersionedFile.
    """
    # KnitVersionedFile takes relpath before transport, and its third
    # positional parameter is file_mode, so the access mode and factory are
    # passed by keyword. The factory must be an instance: its methods are
    # called as bound methods. create=True because the constructor otherwise
    # only opens an existing knit.
    k = KnitVersionedFile(relpath, transport, access_mode='w',
                          factory=KnitPlainFactory(), create=True)
    k._data._open_file()

221

222

223

class KnitVersionedFile(VersionedFile):

224

"""Weave-like structure with faster random access.

225

226

A knit stores a number of texts and a summary of the relationships

227

between them. Texts are identified by a string version-id. Texts

228

are normally stored and retrieved as a series of lines, but can

229

also be passed as single strings.

230

231

Lines are stored with the trailing newline (if any) included, to

232

avoid special cases for files with no final newline. Lines are

233

composed of 8-bit characters, not unicode. The combination of

234

these approaches should mean any 'binary' file can be safely

235

stored and retrieved.

236

"""

237

238

def __init__(self, relpath, transport, file_mode=None, access_mode=None, factory=None,
             basis_knit=None, delta=True, create=False):
    """Open (or create) the knit stored at relpath on transport.

    :param access_mode: 'r' or 'w'; None is treated as 'w'.
    :param factory: content factory; a KnitAnnotateFactory is used when
        none is given.
    :param basis_knit: optional KnitVersionedFile consulted before this one.
    :param delta: stored as self.delta.
    :param create: If not True, only open an existing knit.

    file_mode is accepted but not used by this constructor.
    """
    if access_mode is None:
        access_mode = 'w'
    super(KnitVersionedFile, self).__init__(access_mode)
    assert access_mode in ('r', 'w'), "invalid mode specified %r" % access_mode
    assert not basis_knit or isinstance(basis_knit, KnitVersionedFile), \
        type(basis_knit)

    if not factory:
        factory = KnitAnnotateFactory()

    self.transport = transport
    self.filename = relpath
    self.basis_knit = basis_knit
    self.factory = factory
    self.writable = access_mode == 'w'
    self.delta = delta

    index_name = relpath + INDEX_SUFFIX
    self._index = _KnitIndex(transport, index_name, access_mode,
                             create=create)
    # The data file is created only when the index lists no versions.
    data_name = relpath + DATA_SUFFIX
    no_versions_yet = len(self.versions()) == 0
    self._data = _KnitData(transport, data_name, access_mode,
                           create=no_versions_yet)

262

263

def clear_cache(self):
    """Clear the cache of the data file; the index is not touched."""
    data_file = self._data
    data_file.clear_cache()

266

267

def copy_to(self, name, transport):
    """See VersionedFile.copy_to()."""
    final_index = name + INDEX_SUFFIX
    staged_index = final_index + '.tmp'
    # Stage the index under a temporary name first, to avoid racing with
    # local writes.
    index_source = self.transport.get(self._index._filename)
    transport.put(staged_index, index_source)
    # Then the data file.
    transport.put(name + DATA_SUFFIX, self._data._open_file())
    # Finally move the staged index to its real name.
    transport.rename(staged_index, final_index)

276

277

def create_empty(self, name, transport, mode=None):
    """Return a newly created knit at name using this knit's settings.

    The factory and delta flag are taken from self; mode is not used.
    """
    settings = {
        'factory': self.factory,
        'delta': self.delta,
        'create': True,
    }
    return KnitVersionedFile(name, transport, **settings)

279

280

def _fix_parents(self, version, new_parents):

281

"""Fix the parents list for version.

282

283

This is done by appending a new version to the index

284

with identical data except for the parents list.

285

the parents list must be a superset of the current

286

list.

287

"""

288

current_values = self._index._cache[version]

289

assert set(current_values[4]).difference(set(new_parents)) == set()

290

self._index.add_version(version,

291

current_values[1],

292

current_values[2],

293

current_values[3],

294

new_parents)

295

296

def get_graph_with_ghosts(self):
    """See VersionedFile.get_graph_with_ghosts()."""
    pairs = self._index.get_graph()
    graph = dict(pairs)
    return graph

300

301

@staticmethod
def get_suffixes():
    """See VersionedFile.get_suffixes()."""
    suffixes = [DATA_SUFFIX]
    suffixes.append(INDEX_SUFFIX)
    return suffixes

305

306

def has_ghost(self, version_id):
    """True if there is a ghost reference in the file to version_id."""
    # A version that is present cannot be a ghost.
    if self.has_version(version_id):
        return False
    # optimisable if needed by memoising the _ghosts set.
    for _node, parent_ids in self._index.get_graph():
        for parent_id in parent_ids:
            if parent_id in self._index._cache:
                continue
            if parent_id == version_id:
                return True
    return False

319

320

def versions(self):
    """See VersionedFile.versions."""
    index = self._index
    return index.get_versions()

323

324

def has_version(self, version_id):
    """See VersionedFile.has_version."""
    index = self._index
    return index.has_version(version_id)

327

328

__contains__ = has_version

329

330

def _merge_annotations(self, content, parents):

331

"""Merge annotations for content. This is done by comparing

332

the annotations based on changed to the text."""

333

for parent_id in parents:

334

merge_content = self._get_content(parent_id)

335

seq = SequenceMatcher(None, merge_content.text(), content.text())

336

for i, j, n in seq.get_matching_blocks():

337

if n == 0:

338

continue

339

content._lines[j:j+n] = merge_content._lines[i:i+n]

340

341

def _get_components(self, version_id):

342

"""Return a list of (version_id, method, data) tuples that

343

makes up version specified by version_id of the knit.

344

345

The components should be applied in the order of the returned

346

list.

347

348

The basis knit will be used to the largest extent possible

349

since it is assumed that accesses to it is faster.

350

"""

351

# needed_revisions holds a list of (method, version_id) of

352

# versions that is needed to be fetched to construct the final

353

# version of the file.

354

355

# basis_revisions is a list of versions that needs to be

356

# fetched but exists in the basis knit.

357

358

basis = self.basis_knit

359

needed_versions = []

360

basis_versions = []

361

cursor = version_id

362

363

while 1:

364

picked_knit = self

365

if basis and basis._index.has_version(cursor):

366

picked_knit = basis

367

basis_versions.append(cursor)

368

method = picked_knit._index.get_method(cursor)

369

needed_versions.append((method, cursor))

370

if method == 'fulltext':

371

break

372

cursor = picked_knit.get_parents(cursor)[0]

373

374

components = {}

375

if basis_versions:

376

records = []

377

for comp_id in basis_versions:

378

data_pos, data_size = basis._index.get_data_position(comp_id)

379

records.append((piece_id, data_pos, data_size))

380

components.update(basis._data.read_records(records))

381

382

records = []

383

for comp_id in [vid for method, vid in needed_versions

384

if vid not in basis_versions]:

385

data_pos, data_size = self._index.get_position(comp_id)

386

records.append((comp_id, data_pos, data_size))

387

components.update(self._data.read_records(records))

388

389

# get_data_records returns a mapping with the version id as

390

# index and the value as data. The order the components need

391

# to be applied is held by needed_versions (reversed).

392

out = []

393

for method, comp_id in reversed(needed_versions):

394

out.append((comp_id, method, components[comp_id]))

395

396

return out

397

398

def _get_content(self, version_id):
    """Build and return the content object for version_id.

    The basis knit answers if it holds the version; otherwise the
    components are fetched and applied in order, and the result is checked
    against the stored digest.

    :raises RevisionNotPresent: if version_id is not in this knit.
    :raises KnitCorrupt: if the sha-1 of the rebuilt text does not match.
    """
    if not self.has_version(version_id):
        raise RevisionNotPresent(version_id, self.filename)

    fallback = self.basis_knit
    if fallback and version_id in fallback:
        return fallback._get_content(version_id)

    content = None
    for piece_id, method, (data, digest) in self._get_components(version_id):
        piece_idx = self._index.lookup(piece_id)
        if method == 'fulltext':
            assert content is None
            content = self.factory.parse_fulltext(data, piece_idx)
        elif method == 'line-delta':
            hunks = self.factory.parse_line_delta(data, piece_idx)
            content.apply_delta(hunks)

    if 'no-eol' in self._index.get_options(version_id):
        # Drop the trailing newline from the last line.
        last_origin, last_text = content._lines[-1][0], content._lines[-1][1]
        content._lines[-1] = (last_origin, last_text.rstrip('\n'))

    # digest is the one delivered with the last component applied.
    if sha_strings(content.text()) != digest:
        raise KnitCorrupt(self.filename, 'sha-1 does not match')

    return content

426

427

def _check_versions_present(self, version_ids):

428

"""Check that all specified versions are present."""

429

version_ids = set(version_ids)

430

for r in list(version_ids):

431

if self._index.has_version(r):

432

version_ids.remove(r)

433

if version_ids:

434

raise RevisionNotPresent(list(version_ids)[0], self.filename)

435

436

def _add_lines_with_ghosts(self, version_id, parents, lines):

437

"""See VersionedFile.add_lines_with_ghosts()."""

438

self._check_add(version_id, lines)

439

return self._add(version_id, lines[:], parents, self.delta)

440

441

def _add_lines(self, version_id, parents, lines):

442

"""See VersionedFile.add_lines."""

443

self._check_add(version_id, lines)

444

self._check_versions_present(parents)

445

return self._add(version_id, lines[:], parents, self.delta)

446

447

def _check_add(self, version_id, lines):
    """Verify that version_id and lines may be added to this knit.

    :raises InvalidRevisionId: if version_id contains whitespace.
    :raises RevisionAlreadyPresent: if version_id is already in the knit.
    """
    assert self.writable, "knit is not opened for write"
    ### FIXME escape. RBC 20060228
    if contains_whitespace(version_id):
        raise InvalidRevisionId(version_id)
    if self.has_version(version_id):
        raise RevisionAlreadyPresent(version_id, self.filename)

    if __debug__:
        # A newline may only appear as the final character of a line.
        for candidate in lines:
            assert '\n' not in candidate[:-1]

459

460

def _add(self, version_id, lines, parents, delta):
    """Add a set of lines on top of version specified by parents.

    If delta is true, compress the text as a line-delta against
    the first parent.

    Any versions not present will be converted into ghosts.

    :param lines: list of text lines; its last element is modified in
        place when it lacks a trailing newline.
    :param parents: parent version ids, recorded in the index as given.
    """
    # Only parents that are actually present can be diffed against or
    # have annotations merged from.
    ghostless_parents = []
    for parent in parents:
        if self.has_version(parent):
            ghostless_parents.append(parent)

    if delta and not len(ghostless_parents):
        delta = False

    # The digest covers the text as supplied, before any newline is added.
    digest = sha_strings(lines)
    options = []
    if lines:
        # endswith() rather than lines[-1][-1]: an empty last line would
        # otherwise raise IndexError.
        if not lines[-1].endswith('\n'):
            options.append('no-eol')
            lines[-1] = lines[-1] + '\n'

    lines = self.factory.make(lines, len(self._index))
    if self.factory.annotated and len(ghostless_parents) > 0:
        # Merge annotations from parent texts if so is needed.
        self._merge_annotations(lines, ghostless_parents)

    if len(ghostless_parents) and delta:
        # To speed the extract of texts the delta chain is limited
        # to a fixed number of deltas. This should minimize both
        # I/O and the time spend applying deltas.
        count = 0
        delta_parents = ghostless_parents
        while count < 25:
            parent = delta_parents[0]
            method = self._index.get_method(parent)
            if method == 'fulltext':
                break
            delta_parents = self._index.get_parents(parent)
            count = count + 1
        # No fulltext was reached within the limit: store a fulltext now.
        if method == 'line-delta':
            delta = False

    if delta:
        options.append('line-delta')
        content = self._get_content(ghostless_parents[0])
        delta_hunks = content.line_delta(lines)
        store_lines = self.factory.lower_line_delta(delta_hunks)
    else:
        options.append('fulltext')
        store_lines = self.factory.lower_fulltext(lines)

    where, size = self._data.add_record(version_id, digest, store_lines)
    self._index.add_version(version_id, options, where, size, parents)

518

519

def check(self, progress_bar=None):
    """See VersionedFile.check().

    This implementation performs no checks and returns None.
    """
    return None

521

522

def _clone_text(self, new_version_id, old_version_id, parents):

523

"""See VersionedFile.clone_text()."""

524

# FIXME RBC 20060228 make fast by only inserting an index with null delta.

525

self.add_lines(new_version_id, parents, self.get_lines(old_version_id))

526

527

def get_lines(self, version_id):
    """See VersionedFile.get_lines()."""
    content = self._get_content(version_id)
    return content.text()

530

531

def iter_lines_added_or_present_in_versions(self, version_ids=None):
    """See VersionedFile.iter_lines_added_or_present_in_versions().

    Yields every line stored in the records of the given versions (all
    versions when version_ids is None): all lines of a fulltext record,
    and the added lines of a line-delta record.

    :raises RevisionNotPresent: if a requested version is not in the knit.
    """
    if version_ids is None:
        version_ids = self.versions()
    # we dont care about inclusions, the caller cares.
    # but we need to setup a list of records to visit.
    # we need version_id, position, length
    version_id_records = []
    for version_id in version_ids:
        if not self.has_version(version_id):
            raise RevisionNotPresent(version_id, self.filename)
        data_pos, length = self._index.get_position(version_id)
        version_id_records.append((version_id, data_pos, length))
    pb = bzrlib.ui.ui_factory.nested_progress_bar()
    count = 0
    total = len(version_id_records)
    # Kept as try/except + re-raise rather than try/finally: yield inside
    # try/finally is only legal from Python 2.5 on.
    # NOTE(review): confirm the minimum supported Python before changing.
    try:
        pb.update('Walking content.', count, total)
        for version_id, data, sha_value in \
            self._data.read_records_iter(version_id_records):
            pb.update('Walking content.', count, total)
            method = self._index.get_method(version_id)
            version_idx = self._index.lookup(version_id)
            assert method in ('fulltext', 'line-delta')
            if method == 'fulltext':
                content = self.factory.parse_fulltext(data, version_idx)
                for line in content.text():
                    yield line
            else:
                delta = self.factory.parse_line_delta(data, version_idx)
                # The hunk size gets its own name; unpacking it into
                # 'count' used to overwrite the progress counter.
                for start, end, hunk_size, lines in delta:
                    for origin, line in lines:
                        yield line
            count += 1
        pb.update('Walking content.', total, total)
        pb.finished()
    except:
        pb.update('Walking content.', total, total)
        pb.finished()
        raise

571

572

def num_versions(self):
    """See VersionedFile.num_versions()."""
    index = self._index
    return index.num_versions()

575

576

__len__ = num_versions

577

578

def annotate_iter(self, version_id):
    """See VersionedFile.annotate_iter."""
    to_name = self._get_content(version_id).annotate_iter()
    for origin_idx, line in to_name:
        # Content stores index numbers; callers get version names.
        yield self._index.idx_to_name(origin_idx), line

583

584

def get_parents(self, version_id):
    """See VersionedFile.get_parents."""
    self._check_versions_present([version_id])
    parent_ids = self._index.get_parents(version_id)
    return list(parent_ids)

588

589

def get_parents_with_ghosts(self, version_id):
    """See VersionedFile.get_parents_with_ghosts."""
    self._check_versions_present([version_id])
    parent_ids = self._index.get_parents_with_ghosts(version_id)
    return list(parent_ids)

593

594

def get_ancestry(self, versions):
    """See VersionedFile.get_ancestry.

    versions may be a single version id string or a sequence of ids.
    An empty request yields an empty list without touching the index.
    """
    if isinstance(versions, basestring):
        # A lone version id: treat it as a one-element request.
        versions = [versions]
    if versions:
        self._check_versions_present(versions)
        return self._index.get_ancestry(versions)
    return []

602

603

def get_ancestry_with_ghosts(self, versions):
    """See VersionedFile.get_ancestry_with_ghosts.

    versions may be a single version id string or a sequence of ids.
    An empty request yields an empty list without touching the index.
    """
    if isinstance(versions, basestring):
        # A lone version id: treat it as a one-element request.
        versions = [versions]
    if versions:
        self._check_versions_present(versions)
        return self._index.get_ancestry_with_ghosts(versions)
    return []

611

612

def _reannotate_line_delta(self, other, lines, new_version_id,
                           new_version_idx):
    """Re-annotate line-delta and return new delta.

    Each line's origin is an index position in other; it is mapped to a
    version id there and then to this knit's index position.  Lines that
    originate from new_version_id get new_version_idx.
    """
    def remap(origin):
        # Translate an origin index of `other` into an index of `self`.
        source_version = other._index.idx_to_name(origin)
        if source_version == new_version_id:
            return new_version_idx
        return self._index.lookup(source_version)

    reannotated = []
    for start, end, count, contents in \
            self.factory.parse_line_delta_iter(lines):
        hunk_lines = [(remap(origin), line) for origin, line in contents]
        reannotated.append((start, end, count, hunk_lines))

    return self.factory.lower_line_delta(reannotated)

629

630

def _reannotate_fulltext(self, other, lines, new_version_id,
                         new_version_idx):
    """Re-annotate fulltext and return new version.

    Each line's origin is an index position in other; it is mapped to a
    version id there and then to this knit's index position.  Lines that
    originate from new_version_id get new_version_idx.
    """
    content = self.factory.parse_fulltext(lines, new_version_idx)
    reannotated = []
    for origin, line in content.annotate_iter():
        source_version = other._index.idx_to_name(origin)
        if source_version != new_version_id:
            target_idx = self._index.lookup(source_version)
        else:
            target_idx = new_version_idx
        reannotated.append((target_idx, line))

    return self.factory.lower_fulltext(KnitContent(reannotated))

644

645

#@deprecated_method(zero_eight)

646

def walk(self, version_ids):
    """See VersionedFile.walk.

    Yields (lineno, insert_id, dset, line) tuples exactly as produced by
    Weave.walk over a temporary weave built from the ancestry of
    version_ids.
    """
    # We take the short path here, and extract all relevant texts
    # and put them in a weave and let that do all the work.  Far
    # from optimal, but is much simpler.
    # FIXME RB 20060228 this really is inefficient!
    from bzrlib.weave import Weave

    w = Weave(self.filename)
    # Every version in the graph is tested for membership, so hold the
    # ancestry in a set rather than scanning a list each time.
    ancestry = set(self.get_ancestry(version_ids))
    sorted_graph = topo_sort(self._index.get_graph())
    version_list = [vid for vid in sorted_graph if vid in ancestry]

    # Versions are added in topological order, so parents go in before
    # their children.
    for version_id in version_list:
        lines = self.get_lines(version_id)
        w.add_lines(version_id, self.get_parents(version_id), lines)

    for lineno, insert_id, dset, line in w.walk(version_ids):
        yield lineno, insert_id, dset, line

665

666

667

class _KnitComponentFile(object):
    """Base class for one of the files used to implement a knit database.

    The header methods read self.HEADER, which this class does not define;
    it must be supplied by whoever uses them.
    """

    def __init__(self, transport, filename, mode):
        """Remember the transport, file name and access mode."""
        self._mode = mode
        self._filename = filename
        self._transport = transport

    def write_header(self):
        """Append HEADER to the file.

        Raises KnitCorrupt when the transport reports that the file was
        not empty before the append.
        """
        header = StringIO(self.HEADER)
        if self._transport.append(self._filename, header) != 0:
            raise KnitCorrupt(self._filename, 'misaligned after writing header')

    def check_header(self, fp):
        """Read len(HEADER) from fp; raise KnitHeaderError on a mismatch."""
        found = fp.read(len(self.HEADER))
        if found == self.HEADER:
            return
        raise KnitHeaderError(badline=found)

    def commit(self):
        """Commit is a nop."""

    def __repr__(self):
        parts = (self.__class__.__name__, self._filename)
        return '%s(%s)' % parts

690

691

692

class _KnitIndex(_KnitComponentFile):
    """Manages knit index file.

    The index is already kept in memory and read on startup, to enable
    fast lookups of revision information.  The cursor of the index
    file is always pointing to the end, making it easy to append
    entries.

    _cache maps a version id to its
    (version_id, options, pos, size, parents) tuple.

    _history is a list mapping index positions to version ids.

    The index data format is dictionary compressed when it comes to
    parent references; an index entry may only have parents with a
    lower index number.  As a result, the index is topologically sorted.

    Duplicate entries may be written to the index for a single version id;
    if this is done then the latter one completely replaces the former:
    this allows updates to correct version and parent information.
    Note that the two entries may share the delta, and that successive
    annotations and references MUST point to the first entry.
    """

    HEADER = "# bzr knit index 7\n"

    def _cache_version(self, version_id, options, pos, size, parents):
        """Store an entry in memory, replacing any earlier one.

        A version id keeps the _history position of its first entry.
        """
        # Within this class _history only grows here, together with
        # _cache, so a dict lookup tells us whether the id is already in
        # _history without scanning the list for every record.
        if version_id not in self._cache:
            self._history.append(version_id)
        self._cache[version_id] = (version_id, options, pos, size, parents)

    def _iter_index(self, fp):
        """Yield each remaining line of fp split on whitespace."""
        l = fp.readline()
        while l != '':
            yield l.split()
            l = fp.readline()

    def __init__(self, transport, filename, mode, create=False):
        """Load the index into memory, creating the file if allowed.

        When the file does not exist it is created with just the header,
        but only if mode is 'w' and create is true; otherwise NoSuchFile
        propagates.
        """
        _KnitComponentFile.__init__(self, transport, filename, mode)
        self._cache = {}
        # position in _history is the 'official' index for a revision
        # but the values may have come from a newer entry.
        # so - wc -l of a knit index is != the number of unique names
        # in the weave.
        self._history = []
        pb = bzrlib.ui.ui_factory.nested_progress_bar()
        try:
            count = 0
            total = 1
            try:
                pb.update('read knit index', count, total)
                fp = self._transport.get(self._filename)
                self.check_header(fp)
                for rec in self._iter_index(fp):
                    count += 1
                    total += 1
                    pb.update('read knit index', count, total)
                    # record layout: id options pos size parent...
                    parents = self._parse_parents(rec[4:])
                    self._cache_version(rec[0], rec[1].split(','),
                                        int(rec[2]), int(rec[3]), parents)
            except NoSuchFile:
                if mode != 'w' or not create:
                    raise
                self.write_header()
        finally:
            pb.update('read knit index', total, total)
            pb.finished()

    def _parse_parents(self, compressed_parents):
        """convert a list of string parent values into version ids.

        ints are looked up in the index.
        .FOO values are ghosts and converted in to FOO.
        """
        result = []
        for value in compressed_parents:
            if value.startswith('.'):
                result.append(value[1:])
            else:
                assert isinstance(value, str)
                result.append(self._history[int(value)])
        return result

    def get_graph(self):
        """Return a list of (version_id, parents) for every cached entry."""
        return [(version_id, entry[4])
                for version_id, entry in self._cache.iteritems()]

    def get_ancestry(self, versions):
        """See VersionedFile.get_ancestry."""
        # get a graph of all the mentioned versions:
        graph = {}
        pending = set(versions)
        while pending:
            version = pending.pop()
            # trim ghosts: keep only parents that have an index entry
            parents = [parent for parent in self._cache[version][4]
                       if parent in self._cache]
            for parent in parents:
                # queue parents that have not been completed yet
                if parent not in graph:
                    pending.add(parent)
            graph[version] = parents
        return topo_sort(graph.items())

    def get_ancestry_with_ghosts(self, versions):
        """See VersionedFile.get_ancestry_with_ghosts."""
        # get a graph of all the mentioned versions:
        graph = {}
        pending = set(versions)
        while pending:
            version = pending.pop()
            try:
                parents = self._cache[version][4]
            except KeyError:
                # ghost, fake it
                graph[version] = []
            else:
                # got the parents ok
                for parent in parents:
                    if parent not in graph:
                        pending.add(parent)
                graph[version] = parents
        return topo_sort(graph.items())

    def num_versions(self):
        """Return the number of distinct version ids in the index."""
        return len(self._history)

    __len__ = num_versions

    def get_versions(self):
        """Return the version ids in index order (the internal list)."""
        return self._history

    def idx_to_name(self, idx):
        """Return the version id stored at index position idx."""
        return self._history[idx]

    def lookup(self, version_id):
        """Return the index position of version_id."""
        assert version_id in self._cache
        return self._history.index(version_id)

    def _version_list_to_index(self, versions):
        """Encode versions as the space separated parent field.

        Versions present in the index are written as their position in
        _history; others (ghosts) as '.' followed by the utf-8 encoded id.
        """
        result_list = []
        for version in versions:
            if version in self._cache:
                result_list.append(str(self._history.index(version)))
            else:
                result_list.append('.' + version.encode('utf-8'))
        return ' '.join(result_list)

    def add_version(self, version_id, options, pos, size, parents):
        """Add a version record to the index."""
        self._cache_version(version_id, options, pos, size, parents)

        content = "%s %s %s %s %s\n" % (version_id,
                                        ','.join(options),
                                        pos,
                                        size,
                                        self._version_list_to_index(parents))
        self._transport.append(self._filename, StringIO(content))

    def has_version(self, version_id):
        """True if the version is in the index."""
        return version_id in self._cache

    def get_position(self, version_id):
        """Return data position and size of specified version."""
        entry = self._cache[version_id]
        return (entry[2], entry[3])

    def get_method(self, version_id):
        """Return compression method of specified version."""
        options = self._cache[version_id][1]
        if 'fulltext' in options:
            return 'fulltext'
        else:
            assert 'line-delta' in options
            return 'line-delta'

    def get_options(self, version_id):
        """Return the options list recorded for version_id."""
        return self._cache[version_id][1]

    def get_parents(self, version_id):
        """Return parents of specified version ignoring ghosts."""
        return [parent for parent in self._cache[version_id][4]
                if parent in self._cache]

    def get_parents_with_ghosts(self, version_id):
        """Return parents of specified version with ghosts."""
        return self._cache[version_id][4]

    def check_versions_present(self, version_ids):
        """Check that all specified versions are present.

        Raises RevisionNotPresent for the first id that has no entry.
        """
        for version_id in version_ids:
            if version_id not in self._cache:
                # The file name is stored as _filename by the base class.
                raise RevisionNotPresent(version_id, self._filename)

897

898

899

class _KnitData(_KnitComponentFile):
    """Contents of the knit data file.

    Each record is appended as its own gzip stream.  Parsed and newly
    written records are kept in _records, keyed by version id, as
    (digest, lines) tuples.
    """

    HEADER = "# bzr knit data 7\n"

    def __init__(self, transport, filename, mode, create=False):
        """Set up the data file wrapper; write an empty file if create."""
        _KnitComponentFile.__init__(self, transport, filename, mode)
        self._file = None
        self._checked = False
        if create:
            self._transport.put(self._filename, StringIO(''))
        self._records = {}

    def clear_cache(self):
        """Clear the record cache."""
        self._records = {}

    def _open_file(self):
        """Return the open data file, or None if it does not exist."""
        if self._file is None:
            try:
                self._file = self._transport.get(self._filename)
            except NoSuchFile:
                # Deliberately ignored: the caller gets None back.
                pass
        return self._file

    def add_record(self, version_id, digest, lines):
        """Write new text record to disk.

        Returns (start_pos, size): the value the transport's append
        returned and the length of the compressed record.
        """
        sio = StringIO()
        data_file = GzipFile(None, mode='wb', fileobj=sio)
        print >>data_file, "version %s %d %s" % (version_id, len(lines), digest)
        data_file.writelines(lines)
        print >>data_file, "end %s\n" % version_id
        data_file.close()

        # cache
        self._records[version_id] = (digest, lines)

        content = sio.getvalue()
        sio.seek(0)
        start_pos = self._transport.append(self._filename, sio)
        return start_pos, len(content)

    def _parse_record(self, version_id, data):
        """Decompress one record and return (lines, digest).

        Raises KnitCorrupt when the header line does not have four
        fields, names a different version, or the end line is wrong.
        """
        df = GzipFile(mode='rb', fileobj=StringIO(data))
        # header line: "version <version_id> <line count> <digest>"
        rec = df.readline().split()
        if len(rec) != 4:
            raise KnitCorrupt(self._filename, 'unexpected number of records')
        if rec[1] != version_id:
            raise KnitCorrupt(self._filename,
                              'unexpected version, wanted %r' % version_id)
        lines = int(rec[2])
        record_contents = self._read_record_contents(df, lines)
        l = df.readline()
        if l != 'end %s\n' % version_id:
            raise KnitCorrupt(self._filename, 'unexpected version end line %r, wanted %r'
                              % (l, version_id))
        return record_contents, rec[3]

    def _read_record_contents(self, df, record_lines):
        """Read and return n lines from datafile."""
        return [df.readline() for i in range(record_lines)]

    def read_records_iter(self, records):
        """Read text records from data file and yield result.

        Each passed record is a tuple of (version_id, pos, len) and
        will be read in the given order.  Yields (version_id,
        contents, digest).  records is iterated more than once, so it
        must be a sequence rather than a one-shot iterator.
        """
        needed_records = [(version_id, pos, size)
                          for version_id, pos, size in records
                          if version_id not in self._records]

        if needed_records:
            # We take it that the transport optimizes the fetching as good
            # as possible (ie, reads continuous ranges.)
            response = self._transport.readv(self._filename,
                [(pos, size) for version_id, pos, size in needed_records])

            # Only the uncached records were requested, so the responses
            # must be paired with needed_records, not with every record.
            for (record_id, pos, size), (read_pos, data) in \
                    izip(iter(needed_records), response):
                content, digest = self._parse_record(record_id, data)
                self._records[record_id] = (digest, content)

        for version_id, pos, size in records:
            digest, content = self._records[version_id]
            # hand out copies so callers cannot alter the cached record
            yield version_id, copy(content), copy(digest)

    def read_records(self, records):
        """Read records into a dictionary."""
        components = {}
        for record_id, content, digest in self.read_records_iter(records):
            components[record_id] = (content, digest)
        return components

997

998

999

class InterKnit(InterVersionedFile):
    """Optimised code paths for knit to knit operations."""

    _matching_file_factory = KnitVersionedFile

    @staticmethod
    def is_compatible(source, target):
        """Be compatible with knits: both ends must be KnitVersionedFiles."""
        try:
            if not isinstance(source, KnitVersionedFile):
                return False
            return isinstance(target, KnitVersionedFile)
        except AttributeError:
            return False

    def join(self, pb=None, msg=None, version_ids=None, ignore_missing=False):
        """See InterVersionedFile.join.

        Copies the records the target lacks from the source and merges
        differing parent lists.  Returns the number of records copied.
        The pb argument is replaced by a nested progress bar and msg is
        not used.
        """
        assert isinstance(self.source, KnitVersionedFile)
        assert isinstance(self.target, KnitVersionedFile)

        if version_ids is None:
            version_ids = self.source.versions()
        elif ignore_missing:
            version_ids = set(self.source.versions()).intersection(
                set(version_ids))
        else:
            self.source._check_versions_present(version_ids)

        if not version_ids:
            return 0

        pb = bzrlib.ui.ui_factory.nested_progress_bar()
        try:
            version_ids = list(version_ids)
            if None in version_ids:
                version_ids.remove(None)

            self.source_ancestry = set(self.source.get_ancestry(version_ids))
            this_versions = set(self.target._index.get_versions())
            needed_versions = self.source_ancestry.difference(this_versions)
            cross_check_versions = self.source_ancestry.intersection(
                this_versions)
            mismatched_versions = set()
            for version in cross_check_versions:
                # scan to include needed parents.
                target_parents = set(
                    self.target.get_parents_with_ghosts(version))
                source_parents = set(
                    self.source.get_parents_with_ghosts(version))
                if target_parents == source_parents:
                    continue
                # FIXME TEST this check for cycles being introduced works
                # the logic is we have a cycle if in our graph we are an
                # ancestor of any of the source-only parents.
                for parent in source_parents:
                    if parent not in target_parents:
                        parent_ancestors = self.source.get_ancestry(parent)
                        if version in parent_ancestors:
                            raise errors.GraphCycleError([parent, version])
                # ensure this parent will be available later.
                extra_parents = source_parents.difference(target_parents)
                needed_versions.update(
                    extra_parents.difference(this_versions))
                mismatched_versions.add(version)

            if not needed_versions and not cross_check_versions:
                return 0
            full_list = topo_sort(self.source.get_graph())

            version_list = [
                candidate for candidate in full_list
                if (not self.target.has_version(candidate)
                    and candidate in needed_versions)]

            records = []
            for wanted in version_list:
                data_pos, data_size = self.source._index.get_position(wanted)
                records.append((wanted, data_pos, data_size))

            count = 0
            for version_id, lines, digest \
                    in self.source._data.read_records_iter(records):
                options = self.source._index.get_options(version_id)
                parents = self.source._index.get_parents_with_ghosts(
                    version_id)

                for parent in parents:
                    # if source has the parent, we must have grabbed it
                    # first.
                    assert (self.target.has_version(parent) or not
                            self.source.has_version(parent))

                if self.target.factory.annotated:
                    # FIXME jrydberg: it should be possible to skip
                    # re-annotating components if we know that we are
                    # going to pull all revisions in the same order.
                    new_version_id = version_id
                    new_version_idx = self.target._index.num_versions()
                    if 'fulltext' in options:
                        lines = self.target._reannotate_fulltext(
                            self.source, lines,
                            new_version_id, new_version_idx)
                    elif 'line-delta' in options:
                        lines = self.target._reannotate_line_delta(
                            self.source, lines,
                            new_version_id, new_version_idx)

                count += 1
                pb.update("Joining knit", count, len(version_list))

                pos, size = self.target._data.add_record(
                    version_id, digest, lines)
                self.target._index.add_version(
                    version_id, options, pos, size, parents)

            for version in mismatched_versions:
                target_parents = set(
                    self.target.get_parents_with_ghosts(version))
                source_parents = set(
                    self.source.get_parents_with_ghosts(version))
                # write a combined record to our history preserving the
                # current parents as first in the list
                merged_parents = (
                    self.target.get_parents_with_ghosts(version)
                    + list(source_parents.difference(target_parents)))
                self.target.fix_parents(version, merged_parents)
            return count
        finally:
            pb.clear()
            pb.finished()


InterVersionedFile.register_optimiser(InterKnit)

Older »