/brz/remove-bazaar : revision 1570.1.7

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/repository.py

Committer: Robert Collins
Date: 2006-02-24 23:13:20 UTC
mto: (1587.1.1 integration)
mto: This revision was merged to the branch mainline in revision 1588.
Revision ID: robertc@robertcollins.net-20060224231320-dbaf879d3070bfd7

Replace the slow topo_sort routine with a much faster one for non trivial datasets.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

generate_docs.py

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/repository.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

from copy import deepcopy

from cStringIO import StringIO

from unittest import TestSuite

import xml.sax.saxutils

from bzrlib.decorators import needs_read_lock, needs_write_lock

import bzrlib.errors as errors

from bzrlib.errors import InvalidRevisionId

import bzrlib.gpg as gpg

from bzrlib.lockable_files import LockableFiles

from bzrlib.osutils import safe_unicode

from bzrlib.revision import NULL_REVISION

from bzrlib.store import copy_all

from bzrlib.store.weave import WeaveStore

from bzrlib.store.text import TextStore

from bzrlib.symbol_versioning import *

from bzrlib.trace import mutter

from bzrlib.tree import RevisionTree

from bzrlib.testament import Testament

from bzrlib.tree import EmptyTree

import bzrlib.ui

import bzrlib.xml5

class Repository(object):

"""Repository holding history for one or more branches.

The repository holds and retrieves historical information including

revisions and file history. It's normally accessed only by the Branch,

which views a particular line of development through that history.

The Repository builds on top of Stores and a Transport, which respectively

describe the disk data format and the way of accessing the (possibly

remote) disk.

"""

@needs_write_lock

def add_inventory(self, revid, inv, parents):
    """Store the inventory ``inv`` in the repository under ``revid``.

    The inventory is serialised with the v5 XML serializer and added to
    the 'inventory' control weave inside the current transaction.

    :param revid: The revision id the inventory is filed under.
    :param inv: The inventory to serialise and store.
    :param parents: The revision ids of the parents that revid is known
        to have and that are already in the repository.
    :return: The sha1 of the serialised inventory text.
    """
    text = bzrlib.xml5.serializer_v5.write_inventory_to_string(inv)
    sha1 = bzrlib.osutils.sha_string(text)
    text_lines = bzrlib.osutils.split_lines(text)
    self.control_weaves.add_text('inventory', revid, text_lines, parents,
                                 self.get_transaction())
    return sha1

@needs_write_lock

def add_revision(self, rev_id, rev, inv=None, config=None):
    """File the revision ``rev`` in the revision store as ``rev_id``.

    :param rev_id: the revision id to use.
    :param rev: The revision object.
    :param inv: The inventory for the revision. If None, it is fetched
        with get_inventory() when a signature has to be made.
    :param config: If None no digital signature will be created.
        If supplied its signature_needed method decides whether a
        signature is stored alongside the revision.
    :raises errors.WeaveRevisionNotPresent: if rev_id is not in the
        inventory weave and no inventory was supplied (or loaded).
    """
    signature_wanted = config is not None and config.signature_needed()
    if signature_wanted:
        if inv is None:
            inv = self.get_inventory(rev_id)
        plaintext = Testament(rev, inv).as_short_text()
        self.store_revision_signature(
            gpg.GPGStrategy(config), plaintext, rev_id)
    if rev_id not in self.get_inventory_weave():
        if inv is None:
            raise errors.WeaveRevisionNotPresent(rev_id,
                                                 self.get_inventory_weave())
        # yes, this is not suitable for adding with ghosts.
        self.add_inventory(rev_id, inv, rev.parent_ids)
    # serialise into a scratch buffer and rewind it so the store can read it.
    buf = StringIO()
    bzrlib.xml5.serializer_v5.write_revision(rev, buf)
    buf.seek(0)
    self.revision_store.add(buf, rev_id)
    mutter('added revision_id {%s}', rev_id)

101

102

@needs_read_lock

103

def _all_possible_ids(self):
    """Return every revision id named by the inventory weave."""
    inventory_weave = self.get_inventory_weave()
    return inventory_weave.names()

106

107

@needs_read_lock

108

def all_revision_ids(self):
    """Return a list of all the revision ids held by the repository.

    The candidates come from _all_possible_ids() and are filtered through
    _eliminate_revisions_not_present(). They are in as much topological
    order as the underlying store can present: for weaves, ghosts may lead
    to a lack of correctness until the reweave updates the parents list.
    """
    candidates = self._all_possible_ids()
    return self._eliminate_revisions_not_present(candidates)

117

118

@needs_read_lock

119

def _eliminate_revisions_not_present(self, revision_ids):
    """Filter revision_ids down to those has_revision() reports present.

    :param revision_ids: An iterable of revision ids to check.
    :return: A list of the present revision ids, in their input order.
    """
    return [revision_id for revision_id in revision_ids
            if self.has_revision(revision_id)]

129

130

@staticmethod

131

def create(a_bzrdir):
    """Construct the current default format repository in a_bzrdir.

    :param a_bzrdir: The bzrdir handed to the default format's initialize().
    :return: Whatever the default RepositoryFormat's initialize() returns.
    """
    default_format = RepositoryFormat.get_default_format()
    return default_format.initialize(a_bzrdir)

134

135

def __init__(self, _format, a_bzrdir, control_files, revision_store):
    """Instantiate a Repository.

    :param _format: The format of the repository on disk.
    :param a_bzrdir: The BzrDir of the repository.
    :param control_files: The control files object; locking and
        transactions are delegated to it.
    :param revision_store: The store revisions are read from and added to.

    In the future we will have a single api for all stores for
    getting file texts, inventories and revisions, then
    this construct will accept instances of those things.
    """
    object.__init__(self)
    # private: the on-disk format object.
    self._format = _format
    # the following are part of the public API for Repository:
    self.revision_store = revision_store
    self.control_files = control_files
    self.bzrdir = a_bzrdir

151

152

def lock_write(self):
    """Take a write lock by delegating to control_files.lock_write()."""
    control_files = self.control_files
    control_files.lock_write()

154

155

def lock_read(self):
    """Take a read lock by delegating to control_files.lock_read()."""
    control_files = self.control_files
    control_files.lock_read()

157

158

@needs_read_lock

159

def missing_revision_ids(self, other, revision_id=None):
    """Return the revision ids that other has that this does not.

    The work is delegated to the InterRepository obtained for
    (other, self). These are returned in topological order.

    :param other: The repository to compare against.
    :param revision_id: only return revision ids included by revision_id.
    """
    inter = InterRepository.get(other, self)
    return inter.missing_revision_ids(revision_id)

167

168

@staticmethod

169

def open(base):
    """Open the repository rooted at base.

    For instance, if the repository is at URL/.bzr/repository,
    Repository.open(URL) -> a Repository instance.

    :param base: The location passed to BzrDir.open().
    """
    return bzrlib.bzrdir.BzrDir.open(base).open_repository()

177

178

def copy_content_into(self, destination, revision_id=None, basis=None):
    """Make a complete copy of the content in self into destination.

    This is a destructive operation! Do not use it on existing
    repositories.

    :param destination: The repository receiving the content.
    :param revision_id: Passed through to InterRepository.copy_content().
    :param basis: Passed through to InterRepository.copy_content().
    """
    inter = InterRepository.get(self, destination)
    return inter.copy_content(revision_id, basis)

185

186

def fetch(self, source, revision_id=None, pb=None):
    """Fetch the content required to construct revision_id from source.

    If revision_id is None all content is copied.

    :param source: The repository to fetch from.
    :param pb: Passed through to InterRepository.fetch().
    """
    inter = InterRepository.get(source, self)
    return inter.fetch(revision_id=revision_id, pb=pb)

193

194

def unlock(self):
    """Release the lock by delegating to control_files.unlock()."""
    control_files = self.control_files
    control_files.unlock()

196

197

@needs_read_lock

198

def clone(self, a_bzrdir, revision_id=None, basis=None):
    """Clone this repository into a_bzrdir using the current format.

    Currently no check is made that the format of this repository and
    the bzrdir format are compatible. FIXME RBC 20060201.

    :param a_bzrdir: The bzrdir that receives the cloned repository.
    :param revision_id: Passed through to copy_content_into().
    :param basis: Passed through to copy_content_into().
    :return: The repository the content was copied into.
    """
    target_format = a_bzrdir._format
    if not isinstance(target_format, self.bzrdir._format.__class__):
        # use target default format.
        result = a_bzrdir.create_repository()
    else:
        # FIXME RBC 20060209 split out the repository type to avoid this check ?
        all_in_one_formats = (bzrlib.bzrdir.BzrDirFormat4,
                              bzrlib.bzrdir.BzrDirFormat5,
                              bzrlib.bzrdir.BzrDirFormat6)
        if isinstance(target_format, all_in_one_formats):
            result = a_bzrdir.open_repository()
        else:
            result = self._format.initialize(a_bzrdir,
                                             shared=self.is_shared())
    self.copy_content_into(result, revision_id, basis)
    return result

217

218

def has_revision(self, revision_id):
    """True if this repository has a copy of the revision.

    A revision_id of None is always reported as present; anything else
    is looked up with revision_store.has_id().

    This does not necessarily imply the revision is merged
    or on the mainline.
    """
    if revision_id is None:
        return True
    return self.revision_store.has_id(revision_id)

225

226

@needs_read_lock

227

def get_revision_xml_file(self, revision_id):
    """Return XML file object for revision object.

    :param revision_id: A non-empty string naming the revision.
    :raises InvalidRevisionId: if revision_id is empty or not a string.
    :raises bzrlib.errors.NoSuchRevision: if the revision store lookup
        fails with IndexError or KeyError.
    """
    if not (revision_id and isinstance(revision_id, basestring)):
        raise InvalidRevisionId(revision_id=revision_id, branch=self)
    try:
        return self.revision_store.get(revision_id)
    except (IndexError, KeyError):
        raise bzrlib.errors.NoSuchRevision(self, revision_id)

235

236

@needs_read_lock

237

def get_revision_xml(self, revision_id):
    """Return the content read from get_revision_xml_file(revision_id)."""
    xml_file = self.get_revision_xml_file(revision_id)
    return xml_file.read()

239

240

@needs_read_lock

241

def get_revision(self, revision_id):

242

"""Return the Revision object for a named revision"""

243

xml_file = self.get_revision_xml_file(revision_id)

244

245

try:

246

r = bzrlib.xml5.serializer_v5.read_revision(xml_file)

247

except SyntaxError, e:

248

raise bzrlib.errors.BzrError('failed to unpack revision_xml',

249

[revision_id,

250

str(e)])

251

252

assert r.revision_id == revision_id

253

return r

254

255

@needs_read_lock

256

def get_revision_sha1(self, revision_id):
    """Hash the stored value of a revision, and return it.

    :param revision_id: Id of the revision whose stored XML is hashed.
    :return: The result of bzrlib.osutils.sha_file() on the revision file.
    """
    # In the future, revision entries will be signed. At that
    # point, it is probably best *not* to include the signature
    # in the revision hash. Because that lets you re-sign
    # the revision, (add signatures/remove signatures) and still
    # have all hash pointers stay consistent.
    # But for now, just hash the contents.
    xml_file = self.get_revision_xml_file(revision_id)
    return bzrlib.osutils.sha_file(xml_file)

265

266

@needs_write_lock

267

def store_revision_signature(self, gpg_strategy, plaintext, revision_id):
    """Sign plaintext and file the signature for revision_id.

    :param gpg_strategy: Object whose sign() method produces the signature.
    :param plaintext: The text to sign.
    :param revision_id: The revision the signature is stored against,
        using the "sig" suffix in the revision store.
    """
    signature = gpg_strategy.sign(plaintext)
    self.revision_store.add(StringIO(signature), revision_id, "sig")

270

271

def fileid_involved_between_revs(self, from_revid, to_revid):
    """Find file_id(s) which are involved in the changes between revisions.

    The revisions included by to_revid but not by from_revid are worked
    out from the inventory weave, and the file ids affected by those
    revisions are then looked up with _fileid_involved_by_set().

    :param from_revid: Revision whose inclusions are excluded.
    :param to_revid: Revision whose inclusions are considered.
    """
    # TODO: jam 20060119 This code assumes that w.inclusions will
    #       always be correct. But because of the presence of ghosts
    #       it is possible to be wrong.
    #       One specific example from Robert Collins:
    #       Two branches, with revisions ABC, and AD
    #       C is a ghost merge of D.
    #       Inclusions doesn't recognize D as an ancestor.
    #       If D is ever merged in the future, the weave
    #       won't be fixed, because AD never saw revision C
    #       to cause a conflict which would force a reweave.
    weave = self.get_inventory_weave()
    older = set(weave.inclusions([weave.lookup(from_revid)]))
    newer = set(weave.inclusions([weave.lookup(to_revid)]))
    changed = [weave.idx_to_name(index)
               for index in newer.difference(older)]
    return self._fileid_involved_by_set(changed)

293

294

def fileid_involved(self, last_revid=None):
    """Find all file_ids modified in the ancestry of last_revid.

    :param last_revid: If false (e.g. None), every name in the inventory
        weave is considered; otherwise only the revisions the weave
        reports as included by last_revid.
    """
    weave = self.get_inventory_weave()
    if last_revid:
        indexes = weave.inclusions([weave.lookup(last_revid)])
        changed = [weave.idx_to_name(index) for index in indexes]
    else:
        changed = set(weave._names)
    return self._fileid_involved_by_set(changed)

306

307

def fileid_involved_by_set(self, changes):
    """Find all file_ids modified by the set of revisions passed in.

    Public pass-through to _fileid_involved_by_set().

    :param changes: A set() of revision ids
    """
    # TODO: jam 20060119 This line does *nothing*, remove it.
    #       or better yet, change _fileid_involved_by_set so
    #       that it takes the inventory weave, rather than
    #       pulling it out by itself.
    file_ids = self._fileid_involved_by_set(changes)
    return file_ids

317

318

def _fileid_involved_by_set(self, changes):
    """Find the set of file-ids affected by the set of revisions.

    :param changes: A set() of revision ids.
    :return: A set() of file ids.

    This peeks at the Weave, interpreting each line, looking to
    see if it mentions one of the revisions. And if so, includes
    the file id mentioned.
    This expects both the Weave format, and the serialization
    to have a single line per file/directory, and to have
    file_id="" and revision="" on that line.
    """
    supported_formats = (RepositoryFormat5,
                         RepositoryFormat6,
                         RepositoryFormat7,
                         RepositoryFormatKnit1)
    assert isinstance(self._format, supported_formats), \
        "fileid_involved only supported for branches which store inventory as unnested xml"

    def attribute_value(text, marker):
        # Return the unescaped value that follows marker (which ends with
        # the opening quote), or None when marker does not occur in text.
        begin = text.find(marker)
        if begin < 0:
            return None
        begin += len(marker)
        finish = text.find('"', begin)
        assert finish >= 0
        return xml.sax.saxutils.unescape(text[begin:finish])

    weave = self.get_inventory_weave()
    found = set()
    for entry in weave._weave:
        # it is ugly, but it is due to the weave structure: only the
        # string entries are text lines.
        if not isinstance(entry, basestring):
            continue

        file_id = attribute_value(entry, 'file_id="')
        # skip lines without a file id, and file ids already collected.
        if file_id is None or file_id in found:
            continue

        revision_id = attribute_value(entry, 'revision="')
        if revision_id is not None and revision_id in changes:
            found.add(file_id)
    return found

362

363

@needs_read_lock

364

def get_inventory_weave(self):
    """Return the 'inventory' control weave for the current transaction."""
    transaction = self.get_transaction()
    return self.control_weaves.get_weave('inventory', transaction)

367

368

@needs_read_lock

369

def get_inventory(self, revision_id):
    """Return the Inventory object stored for revision_id.

    The XML from get_inventory_xml() is parsed with the v5 serializer.
    """
    inventory_xml = self.get_inventory_xml(revision_id)
    serializer = bzrlib.xml5.serializer_v5
    return serializer.read_inventory_from_string(inventory_xml)

373

374

@needs_read_lock

375

def get_inventory_xml(self, revision_id):
    """Return the inventory XML for revision_id.

    The value is whatever the inventory weave's get_text() returns for
    the revision.

    :param revision_id: A string naming the revision (asserted).
    :raises bzrlib.errors.HistoryMissing: if the weave lookup fails with
        IndexError.
    """
    assert isinstance(revision_id, basestring), type(revision_id)
    try:
        weave = self.get_inventory_weave()
        index = weave.lookup(revision_id)
        return weave.get_text(index)
    except IndexError:
        raise bzrlib.errors.HistoryMissing(self, 'inventory', revision_id)

383

384

@needs_read_lock

385

def get_inventory_sha1(self, revision_id):
    """Return the inventory_sha1 recorded on the revision object."""
    revision = self.get_revision(revision_id)
    return revision.inventory_sha1

389

390

@needs_read_lock

391

def get_revision_inventory(self, revision_id):
    """Return inventory of a past revision.

    :param revision_id: The revision whose inventory is wanted.
    :raises NotImplementedError: if revision_id is None.
    """
    # TODO: Unify this with get_inventory()
    # bzr 0.0.6 and later imposes the constraint that the inventory_id
    # must be the same as its revision, so this is trivial.
    if revision_id is not None:
        return self.get_inventory(revision_id)
    # This does not make sense: if there is no revision,
    # then it is the current tree inventory surely ?!
    # and thus get_root_id() is something that looks at the last
    # commit on the branch, and the get_root_id is an inventory check.
    raise NotImplementedError

405

406

@needs_read_lock

407

def is_shared(self):
    """Return True if this repository is flagged as a shared repository.

    The flag is the presence of 'shared-storage' on the control files
    transport.
    """
    # FIXME format 4-6 cannot be shared, this is technically faulty.
    transport = self.control_files._transport
    return transport.has('shared-storage')

411

412

@needs_read_lock

413

def revision_tree(self, revision_id):
    """Return Tree for a revision on this branch.

    `revision_id` may be None or NULL_REVISION for the null revision, in
    which case an `EmptyTree` is returned; otherwise a RevisionTree built
    from the revision's inventory.
    """
    # TODO: refactor this to use an existing revision object
    # so we don't need to read it in twice.
    if revision_id is None or revision_id == NULL_REVISION:
        return EmptyTree()
    inventory = self.get_revision_inventory(revision_id)
    return RevisionTree(self, inventory, revision_id)

425

426

@needs_read_lock

427

def get_ancestry(self, revision_id):
    """Return a list of revision-ids integrated by a revision.

    The list always starts with None, followed by the names of the
    revisions the inventory weave reports as included by revision_id.
    This is topologically sorted.

    :raises errors.NoSuchRevision: if revision_id is not None and
        has_revision() reports it missing.
    """
    ancestry = [None]
    if revision_id is None:
        return ancestry
    if not self.has_revision(revision_id):
        raise errors.NoSuchRevision(self, revision_id)
    weave = self.get_inventory_weave()
    included = weave.inclusions([weave.lookup(revision_id)])
    return ancestry + [weave.idx_to_name(index) for index in included]

439

440

@needs_read_lock

441

def print_file(self, file, revision_id):
    """Print `file` to stdout.

    FIXME RBC 20060125 as John Meinel points out this is a bad api
    - it writes to stdout, it assumes that that is valid etc. Fix
    by creating a new more flexible convenience function.

    :param file: Path of the file, looked up in the inventory of the
        revision tree for revision_id.
    :param revision_id: The revision whose tree is consulted.
    :raises errors.BzrError: if the path has no file id in that revision.
    """
    tree = self.revision_tree(revision_id)
    # use inventory as it was in that revision
    file_id = tree.inventory.path2id(file)
    if not file_id:
        # The repository has no revno mapping of its own, so the error
        # names the revision id rather than a revision number.
        # TODO: This should not be BzrError,
        # but NoSuchFile doesn't fit either
        raise errors.BzrError('%r is not present in revision %s'
                              % (file, revision_id))
    tree.print_file(file_id)

464

465

def get_transaction(self):
    """Return the transaction reported by control_files.get_transaction()."""
    control_files = self.control_files
    return control_files.get_transaction()

467

468

@needs_write_lock

469

def set_make_working_trees(self, new_value):
    """Set the policy flag for making working trees when creating branches.

    This only applies to branches that use this repository.

    The default is 'True'. The policy is recorded as a 'no-working-trees'
    marker: it is deleted to enable working trees and written (empty) to
    disable them.

    :param new_value: True to restore the default, False to disable making
        working trees.
    :raises NotImplementedError: for repository formats 4, 5 and 6.
    """
    # FIXME: split out into a new class/strategy ?
    unsupported_formats = (RepositoryFormat4,
                           RepositoryFormat5,
                           RepositoryFormat6)
    if isinstance(self._format, unsupported_formats):
        raise NotImplementedError(self.set_make_working_trees)
    if not new_value:
        self.control_files.put_utf8('no-working-trees', '')
        return
    try:
        self.control_files._transport.delete('no-working-trees')
    except errors.NoSuchFile:
        # the marker is already absent, so the default is already in force.
        pass

490

491

def make_working_trees(self):
    """Returns the policy for making working trees on new branches.

    Formats 4, 5 and 6 always answer True; other formats answer True
    unless the 'no-working-trees' marker exists on the control transport.
    """
    # FIXME: split out into a new class/strategy ?
    always_make_trees = (RepositoryFormat4,
                         RepositoryFormat5,
                         RepositoryFormat6)
    if isinstance(self._format, always_make_trees):
        return True
    marker_present = self.control_files._transport.has('no-working-trees')
    return not marker_present

499

500

@needs_write_lock

501

def sign_revision(self, revision_id, gpg_strategy):
    """Sign the short testament of revision_id and store the signature.

    :param revision_id: The revision to sign.
    :param gpg_strategy: Passed to store_revision_signature() to do the
        signing.
    """
    testament = Testament.from_revision(self, revision_id)
    plaintext = testament.as_short_text()
    self.store_revision_signature(gpg_strategy, plaintext, revision_id)

504

505

506

class AllInOneRepository(Repository):
    """Legacy support - the repository behaviour for all-in-one branches."""

    def __init__(self, _format, a_bzrdir, revision_store):
        """Set up the stores for an all-in-one (format 4, 5 or 6) repository.

        :param _format: The repository format; it selects which stores
            are created.
        :param a_bzrdir: The bzrdir whose control files are reused.
        :param revision_store: The revision store; the 'sig' suffix is
            registered on it.
        :raises errors.BzrError: if _format is not format 4, 5 or 6.
        """
        # we reuse one control files instance.
        control_files = a_bzrdir._control_files
        dir_mode = control_files._dir_mode
        file_mode = control_files._file_mode

        def get_weave(name, prefixed=False):
            # Build a WeaveStore on the control transport below name.
            weave_name = ''
            if name:
                weave_name = safe_unicode(name)
            relpath = a_bzrdir._control_files._escape(weave_name)
            transport = a_bzrdir._control_files._transport.clone(relpath)
            weave_store = WeaveStore(transport, prefixed=prefixed,
                                     dir_mode=dir_mode,
                                     file_mode=file_mode)
            if a_bzrdir._control_files._transport.should_cache():
                weave_store.enable_cache = True
            return weave_store

        def get_store(name, compressed=True, prefixed=False):
            # Build a TextStore on the control transport below name.
            # FIXME: This approach of assuming stores are all entirely compressed
            # or entirely uncompressed is tidy, but breaks upgrade from
            # some existing branches where there's a mixture; we probably
            # still want the option to look for both.
            relpath = a_bzrdir._control_files._escape(name)
            transport = a_bzrdir._control_files._transport.clone(relpath)
            return TextStore(transport,
                             prefixed=prefixed, compressed=compressed,
                             dir_mode=dir_mode,
                             file_mode=file_mode)

        # not broken out yet because the controlweaves|inventory_store
        # and text_store | weave_store bits are still different.
        if isinstance(_format, RepositoryFormat4):
            self.inventory_store = get_store('inventory-store')
            self.text_store = get_store('text-store')
        elif isinstance(_format, RepositoryFormat5):
            self.control_weaves = get_weave('')
            self.weave_store = get_weave('weaves')
        elif isinstance(_format, RepositoryFormat6):
            self.control_weaves = get_weave('')
            self.weave_store = get_weave('weaves', prefixed=True)
        else:
            raise errors.BzrError(
                'unreachable code: unexpected repository format.')
        revision_store.register_suffix('sig')
        super(AllInOneRepository, self).__init__(
            _format, a_bzrdir, a_bzrdir._control_files, revision_store)

560

561

562

class MetaDirRepository(Repository):
    """A repository stored in the meta-dir (split out) layout."""

    def __init__(self, _format, a_bzrdir, control_files, revision_store):
        """Set up the weave stores appropriate for _format.

        :param _format: The repository format object; only RepositoryFormat7
            and RepositoryFormatKnit1 instances are accepted.
        :param a_bzrdir: The bzrdir this repository belongs to.
        :param control_files: The lockable control files of the repository.
        :param revision_store: The store holding revisions.
        :raises BzrError: if _format is not one of the accepted formats.
        """
        super(MetaDirRepository, self).__init__(_format,
                                                a_bzrdir,
                                                control_files,
                                                revision_store)

        # NOTE(review): self.control_files and self._format are presumably
        # set by Repository.__init__ - confirm against the base class.
        dir_mode = self.control_files._dir_mode
        file_mode = self.control_files._file_mode

        def get_weave(name, prefixed=False):
            """Return a WeaveStore rooted at name below the control dir."""
            if not name:
                name = ''
            else:
                name = safe_unicode(name)
            location = self.control_files._escape(name)
            store = WeaveStore(
                self.control_files._transport.clone(location),
                prefixed=prefixed,
                dir_mode=dir_mode,
                file_mode=file_mode)
            if self.control_files._transport.should_cache():
                store.enable_cache = True
            return store

        # Both supported formats differ only in the directory that holds the
        # per-file texts; reject anything else before creating any store.
        if isinstance(self._format, RepositoryFormat7):
            text_dir = 'weaves'
        elif isinstance(self._format, RepositoryFormatKnit1):
            text_dir = 'knits'
        else:
            raise errors.BzrError('unreachable code: unexpected repository'
                                  ' format.')
        self.control_weaves = get_weave('')
        self.weave_store = get_weave(text_dir, prefixed=True)

597

598

599

class RepositoryFormat(object):
    """A repository format.

    Formats provide three things:
     * An initialization routine to construct repository data on disk.
     * a format string which is used when the BzrDir supports versioned
       children.
     * an open routine which returns a Repository instance.

    Formats are placed in a dict by their format string for reference
    during opening. These should be subclasses of RepositoryFormat
    for consistency.

    Once a format is deprecated, just deprecate the initialize and open
    methods on the format class. Do not deprecate the object, as the
    object will be created every system load.

    Common instance attributes:
    _matchingbzrdir - the bzrdir format that the repository format was
    originally written to work with. This can be used if manually
    constructing a bzrdir and repository, or more commonly for test suite
    parameterisation.
    """

    _default_format = None
    """The default format used for new repositories."""

    _formats = {}
    """The known formats."""

    @classmethod
    def find_format(klass, a_bzrdir):
        """Return the format for the repository object in a_bzrdir.

        :param a_bzrdir: The bzrdir whose repository 'format' file is read.
        :raises NoRepositoryPresent: if the 'format' file does not exist.
        :raises UnknownFormatError: if the format string read from disk has
            not been registered.
        """
        try:
            transport = a_bzrdir.get_repository_transport(None)
            format_string = transport.get("format").read()
        except errors.NoSuchFile:
            raise errors.NoRepositoryPresent(a_bzrdir)
        # Only the registry lookup is guarded by the KeyError handler, so
        # format_string is always bound when the error is reported.
        try:
            return klass._formats[format_string]
        except KeyError:
            raise errors.UnknownFormatError(format_string)

    @classmethod
    def get_default_format(klass):
        """Return the current default format."""
        return klass._default_format

    def get_format_string(self):
        """Return the ASCII format string that identifies this format.

        Note that in pre format ?? repositories the format string is
        not permitted nor written to disk.
        """
        raise NotImplementedError(self.get_format_string)

    def _get_revision_store(self, repo_transport, control_files):
        """Return the revision store object for this a_bzrdir."""
        raise NotImplementedError(self._get_revision_store)

    def _get_rev_store(self,
                       transport,
                       control_files,
                       name,
                       compressed=True,
                       prefixed=False):
        """Common logic for getting a revision store for a repository.

        see self._get_revision_store for the method to
        get the store for a repository.

        :param transport: Transport that is cloned at name to hold the store.
        :param control_files: Supplies the _dir_mode and _file_mode applied
            to the store.
        :param name: Relative name of the store directory; a false value is
            treated as ''.
        :param compressed: Passed through to TextStore.
        :param prefixed: Passed through to TextStore.
        :return: A TextStore with the 'sig' suffix registered.
        """
        if name:
            name = safe_unicode(name)
        else:
            name = ''
        dir_mode = control_files._dir_mode
        file_mode = control_files._file_mode
        revision_store = TextStore(transport.clone(name),
                                   prefixed=prefixed,
                                   compressed=compressed,
                                   dir_mode=dir_mode,
                                   file_mode=file_mode)
        revision_store.register_suffix('sig')
        return revision_store

    def initialize(self, a_bzrdir, shared=False):
        """Initialize a repository of this format in a_bzrdir.

        :param a_bzrdir: The bzrdir to put the new repository in.
        :param shared: The repository should be initialized as a sharable one.

        This may raise UninitializableFormat if shared repositories are not
        compatible with the a_bzrdir.
        """
        # Abstract, like get_format_string() and open(): fail loudly rather
        # than silently returning None when a subclass forgets to override.
        raise NotImplementedError(self.initialize)

    def is_supported(self):
        """Is this format supported?

        Supported formats must be initializable and openable.
        Unsupported formats may not support initialization or committing or
        some other features depending on the reason for not being supported.
        """
        return True

    def open(self, a_bzrdir, _found=False):
        """Return an instance of this format for the bzrdir a_bzrdir.

        _found is a private parameter, do not use it.
        """
        raise NotImplementedError(self.open)

    @classmethod
    def register_format(klass, format):
        """Add format to the registry, keyed by its format string."""
        klass._formats[format.get_format_string()] = format

    @classmethod
    def set_default_format(klass, format):
        """Make format the default used for new repositories."""
        klass._default_format = format

    @classmethod
    def unregister_format(klass, format):
        """Remove format from the registry; it must be the registered one."""
        assert klass._formats[format.get_format_string()] is format
        del klass._formats[format.get_format_string()]

721

722

723

class PreSplitOutRepositoryFormat(RepositoryFormat):
    """Base class for the pre split out repository formats."""

    def initialize(self, a_bzrdir, shared=False, _internal=False):
        """Create a weave repository.

        TODO: when creating split out bzr branch formats, move this to a common
        base for Format5, Format6. or something like that.

        :param a_bzrdir: The bzrdir to create the repository in.
        :param shared: Must be false; these formats cannot be shared.
        :param _internal: Private. When false the repository is only opened,
            because it is always initialized together with the bzrdir.
        :return: The opened repository.
        :raises IncompatibleFormat: if shared is requested.
        """
        from bzrlib.weavefile import write_weave_v5
        from bzrlib.weave import Weave

        if shared:
            raise errors.IncompatibleFormat(self, a_bzrdir._format)

        if not _internal:
            # always initialized when the bzrdir is.
            return self.open(a_bzrdir, _found=True)

        # Create an empty weave
        sio = StringIO()
        write_weave_v5(Weave(), sio)
        empty_weave = sio.getvalue()

        mutter('creating repository in %s.', a_bzrdir.transport.base)
        dirs = ['revision-store', 'weaves']
        files = [('inventory.weave', StringIO(empty_weave)),
                 ]

        # FIXME: RBC 20060125 dont peek under the covers
        # NB: no need to escape relative paths that are url safe.
        control_files = LockableFiles(a_bzrdir.transport, 'branch-lock')
        control_files.lock_write()
        try:
            # Directory creation happens inside the try block so the write
            # lock is released even when mkdir_multi fails.
            control_files._transport.mkdir_multi(
                dirs, mode=control_files._dir_mode)
            for filename, content in files:
                control_files.put(filename, content)
        finally:
            control_files.unlock()
        return self.open(a_bzrdir, _found=True)

    def open(self, a_bzrdir, _found=False):
        """See RepositoryFormat.open().

        :raises NotImplementedError: if _found is false; probing for these
            formats is not implemented here.
        """
        if not _found:
            # we are being called directly and must probe.
            raise NotImplementedError

        repo_transport = a_bzrdir.get_repository_transport(None)
        control_files = a_bzrdir._control_files
        revision_store = self._get_revision_store(repo_transport, control_files)
        return AllInOneRepository(_format=self,
                                  a_bzrdir=a_bzrdir,
                                  revision_store=revision_store)

778

779

780

class RepositoryFormat4(PreSplitOutRepositoryFormat):
    """Bzr repository format 4.

    This repository format has:
     - flat stores
     - TextStores for texts, inventories and revisions.

    This format is deprecated: it indexes texts using a text id which is
    removed in format 5; initialization and write support for this format
    has been removed.
    """

    def __init__(self):
        """Create the format and record its matching bzrdir format."""
        super(RepositoryFormat4, self).__init__()
        self._matchingbzrdir = bzrlib.bzrdir.BzrDirFormat4()

    def initialize(self, url, shared=False, _internal=False):
        """Always fail: format 4 repositories cannot be created."""
        raise errors.UninitializableFormat(self)

    def is_supported(self):
        """Report that format 4 is not supported.

        The model changed from 4 to 5 and the conversion logic is
        expensive - so doing it on the fly was not feasible.
        """
        return False

    def _get_revision_store(self, repo_transport, control_files):
        """See RepositoryFormat._get_revision_store()."""
        # Default _get_rev_store options are used for the revision store.
        store = self._get_rev_store(repo_transport,
                                    control_files,
                                    'revision-store')
        return store

814

815

816

class RepositoryFormat5(PreSplitOutRepositoryFormat):
    """Bzr control format 5.

    This repository format has:
     - weaves for file texts and inventory
     - flat stores
     - TextStores for revisions and signatures.
    """

    def __init__(self):
        """Create the format and record its matching bzrdir format."""
        super(RepositoryFormat5, self).__init__()
        self._matchingbzrdir = bzrlib.bzrdir.BzrDirFormat5()

    def _get_revision_store(self, repo_transport, control_files):
        """See RepositoryFormat._get_revision_store()."""
        # Format 5 asks for an uncompressed store.
        store = self._get_rev_store(repo_transport,
                                    control_files,
                                    'revision-store',
                                    compressed=False)
        return store

836

837

838

class RepositoryFormat6(PreSplitOutRepositoryFormat):
    """Bzr control format 6.

    This repository format has:
     - weaves for file texts and inventory
     - hash subdirectory based stores.
     - TextStores for revisions and signatures.
    """

    def __init__(self):
        """Create the format and record its matching bzrdir format."""
        super(RepositoryFormat6, self).__init__()
        self._matchingbzrdir = bzrlib.bzrdir.BzrDirFormat6()

    def _get_revision_store(self, repo_transport, control_files):
        """See RepositoryFormat._get_revision_store()."""
        # Format 6 asks for an uncompressed, prefixed store.
        store = self._get_rev_store(repo_transport,
                                    control_files,
                                    'revision-store',
                                    compressed=False,
                                    prefixed=True)
        return store

858

859

860

class MetaDirRepositoryFormat(RepositoryFormat):
    """Common base class for the new repositories using the metadir layout."""

    def __init__(self):
        """Create the format and record its matching bzrdir format."""
        super(MetaDirRepositoryFormat, self).__init__()
        self._matchingbzrdir = bzrlib.bzrdir.BzrDirMetaFormat1()

    def _create_control_files(self, a_bzrdir):
        """Create the required files and the initial control_files object.

        :param a_bzrdir: The bzrdir whose repository transport receives the
            new lock file.
        :return: A LockableFiles on the repository transport.
        """
        # FIXME: RBC 20060125 dont peek under the covers
        # NB: no need to escape relative paths that are url safe.
        lock_file = 'lock'
        repository_transport = a_bzrdir.get_repository_transport(self)
        # TODO get the file mode from the bzrdir lock files., mode=file_mode)
        repository_transport.put(lock_file, StringIO())
        control_files = LockableFiles(repository_transport, lock_file)
        return control_files

    def _get_revision_store(self, repo_transport, control_files):
        """See RepositoryFormat._get_revision_store()."""
        return self._get_rev_store(repo_transport,
                                   control_files,
                                   'revision-store',
                                   compressed=False,
                                   prefixed=True,
                                   )

    def open(self, a_bzrdir, _found=False, _override_transport=None):
        """See RepositoryFormat.open().

        :param _override_transport: INTERNAL USE ONLY. Allows opening the
                                    repository at a slightly different url
                                    than normal. I.e. during 'upgrade'.
        """
        if not _found:
            format = RepositoryFormat.find_format(a_bzrdir)
            assert format.__class__ == self.__class__
        if _override_transport is not None:
            repo_transport = _override_transport
        else:
            repo_transport = a_bzrdir.get_repository_transport(None)
        control_files = LockableFiles(repo_transport, 'lock')
        revision_store = self._get_revision_store(repo_transport, control_files)
        return MetaDirRepository(_format=self,
                                 a_bzrdir=a_bzrdir,
                                 control_files=control_files,
                                 revision_store=revision_store)

    def _upload_blank_content(self, a_bzrdir, dirs, files, utf8_files, shared):
        """Upload the initial blank content.

        :param a_bzrdir: The bzrdir the repository is being created in.
        :param dirs: Directory names to create under the control transport.
        :param files: (name, file-like content) pairs written with put().
        :param utf8_files: (name, text) pairs written with put_utf8().
        :param shared: When True an empty 'shared-storage' file is written.
        """
        control_files = self._create_control_files(a_bzrdir)
        control_files.lock_write()
        try:
            # Directory creation happens inside the try block so the write
            # lock is released even when mkdir_multi fails.
            control_files._transport.mkdir_multi(
                dirs, mode=control_files._dir_mode)
            for filename, content in files:
                control_files.put(filename, content)
            for filename, content in utf8_files:
                control_files.put_utf8(filename, content)
            if shared == True:
                control_files.put_utf8('shared-storage', '')
        finally:
            control_files.unlock()

922

923

924

class RepositoryFormat7(MetaDirRepositoryFormat):
    """Bzr repository 7.

    This repository format has:
     - weaves for file texts and inventory
     - hash subdirectory based stores.
     - TextStores for revisions and signatures.
     - a format marker of its own
     - an optional 'shared-storage' flag
     - an optional 'no-working-trees' flag
    """

    def get_format_string(self):
        """See RepositoryFormat.get_format_string()."""
        return "Bazaar-NG Repository format 7"

    def initialize(self, a_bzrdir, shared=False):
        """Create a weave repository.

        :param a_bzrdir: The bzrdir to create the repository in.
        :param shared: If true the repository will be initialized as a shared
                       repository.
        :return: The newly created repository, opened.
        """
        from bzrlib.weavefile import write_weave_v5
        from bzrlib.weave import Weave

        # Serialise an empty weave; its text seeds inventory.weave.
        buf = StringIO()
        write_weave_v5(Weave(), buf)
        inventory_text = buf.getvalue()

        mutter('creating repository in %s.', a_bzrdir.transport.base)
        self._upload_blank_content(
            a_bzrdir,
            ['revision-store', 'weaves'],
            [('inventory.weave', StringIO(inventory_text))],
            [('format', self.get_format_string())],
            shared)
        return self.open(a_bzrdir=a_bzrdir, _found=True)

962

963

964

class RepositoryFormatKnit1(MetaDirRepositoryFormat):
    """Bzr repository knit format 1.

    This repository format has:
     - knits for file texts and inventory
     - hash subdirectory based stores.
     - knits for revisions and signatures
     - TextStores for revisions and signatures.
     - a format marker of its own
     - an optional 'shared-storage' flag
     - an optional 'no-working-trees' flag
    """

    def get_format_string(self):
        """See RepositoryFormat.get_format_string()."""
        return "Bazaar-NG Knit Repository Format 1"

    def initialize(self, a_bzrdir, shared=False):
        """Create a knit format 1 repository.

        :param a_bzrdir: The bzrdir to create the repository in.
        :param shared: If true the repository will be initialized as a shared
                       repository.
        :return: The newly created repository, opened.

        XXX NOTE that this currently uses a Weave for testing and will become
            a Knit in due course.
        """
        from bzrlib.weavefile import write_weave_v5
        from bzrlib.weave import Weave

        # Serialise an empty weave; its text seeds inventory.weave.
        buf = StringIO()
        write_weave_v5(Weave(), buf)
        inventory_text = buf.getvalue()

        mutter('creating repository in %s.', a_bzrdir.transport.base)
        self._upload_blank_content(
            a_bzrdir,
            ['revision-store', 'knits'],
            [('inventory.weave', StringIO(inventory_text))],
            [('format', self.get_format_string())],
            shared)
        return self.open(a_bzrdir=a_bzrdir, _found=True)

1005

1006

1007

# Only formats that provide a format string are registered: the others
# cannot be discovered from disk nor created independently.
_default_format = RepositoryFormat7()
RepositoryFormat.register_format(_default_format)
RepositoryFormat.register_format(RepositoryFormatKnit1())
RepositoryFormat.set_default_format(_default_format)
# Formats 4, 5 and 6 do not define a format string, so they are only kept
# in this list instead of the registry.
_legacy_formats = [
    RepositoryFormat4(),
    RepositoryFormat5(),
    RepositoryFormat6(),
    ]

1016

1017

1018

class InterRepository(object):
    """This class represents operations taking place between two repositories.

    Its instances have methods like copy_content and fetch, and contain
    references to the source and target repositories these operations can be
    carried out on.

    Often we will provide convenience methods on 'repository' which carry out
    operations with another repository - they will always forward to
    InterRepository.get(other).method_name(parameters).
    """
    # XXX: FIXME: FUTURE: robertc
    # testing of these probably requires a factory in optimiser type, and
    # then a test adapter to test each type thoroughly.

    _optimisers = set()
    """The available optimised InterRepository types."""

    def __init__(self, source, target):
        """Construct a default InterRepository instance. Please use 'get'.

        Only subclasses of InterRepository should call
        InterRepository.__init__ - clients should call InterRepository.get
        instead which will create an optimised InterRepository if possible.
        """
        self.source = source
        self.target = target

    @needs_write_lock
    def copy_content(self, revision_id=None, basis=None):
        """Make a complete copy of the content in self into destination.

        This is a destructive operation! Do not use it on existing
        repositories.

        :param revision_id: Only copy the content needed to construct
                            revision_id and its parents.
        :param basis: Copy the needed data preferentially from basis.
        """
        try:
            self.target.set_make_working_trees(self.source.make_working_trees())
        except NotImplementedError:
            # Best effort: not every repository implements this setting.
            pass
        # grab the basis available data
        if basis is not None:
            self.target.fetch(basis, revision_id=revision_id)
        # but dont bother fetching if we have the needed data now.
        if (revision_id not in (None, NULL_REVISION) and
            self.target.has_revision(revision_id)):
            return
        self.target.fetch(self.source, revision_id=revision_id)

    def _double_lock(self, lock_source, lock_target):
        """Take out two locks, rolling back the first if the second throws.

        :param lock_source: Callable that locks the source repository.
        :param lock_target: Callable that locks the target repository.
        """
        lock_source()
        try:
            lock_target()
        except Exception:
            # we want to ensure that we don't leave source locked by mistake.
            # and any error on target should not confuse source.
            self.source.unlock()
            raise

    @needs_write_lock
    def fetch(self, revision_id=None, pb=None):
        """Fetch the content required to construct revision_id.

        The content is copied from source to target.

        :param revision_id: if None all content is copied, if NULL_REVISION no
                            content is copied.
        :param pb: optional progress bar to use for progress reports. If not
                   provided a default one will be created.

        Returns the copied revision count and the failed revisions in a tuple:
        (copied, failures).
        """
        from bzrlib.fetch import RepoFetcher
        mutter("Using fetch logic to copy between %s(%s) and %s(%s)",
               self.source, self.source._format, self.target, self.target._format)
        f = RepoFetcher(to_repository=self.target,
                        from_repository=self.source,
                        last_revision=revision_id,
                        pb=pb)
        return f.count_copied, f.failed_revisions

    @classmethod
    def get(klass, repository_source, repository_target):
        """Retrieve an InterRepository worker object for these repositories.

        :param repository_source: the repository to be the 'source' member of
                                  the InterRepository instance.
        :param repository_target: the repository to be the 'target' member of
                                  the InterRepository instance.
        If an optimised InterRepository worker exists it will be used otherwise
        a default InterRepository instance will be created.
        """
        for provider in klass._optimisers:
            if provider.is_compatible(repository_source, repository_target):
                return provider(repository_source, repository_target)
        return InterRepository(repository_source, repository_target)

    def lock_read(self):
        """Take out a logical read lock.

        This will lock the source and the target. The source gets
        a read lock and the target a read lock.
        """
        self._double_lock(self.source.lock_read, self.target.lock_read)

    def lock_write(self):
        """Take out a logical write lock.

        This will lock the source and the target. The source gets
        a read lock and the target a write lock.
        """
        self._double_lock(self.source.lock_read, self.target.lock_write)

    @needs_read_lock
    def missing_revision_ids(self, revision_id=None):
        """Return the revision ids that source has that target does not.

        These are returned in topological order.

        :param revision_id: only return revision ids included by this
                            revision_id.
        """
        # generic, possibly worst case, slow code path.
        target_ids = set(self.target.all_revision_ids())
        if revision_id is not None:
            source_ids = self.source.get_ancestry(revision_id)
            # The leading entry is expected to be None and must be dropped.
            # The pop is done outside the assert so that it still happens
            # when assertions are stripped (python -O).
            first = source_ids.pop(0)
            assert first is None
        else:
            source_ids = self.source.all_revision_ids()
        result_set = set(source_ids).difference(target_ids)
        # this may look like a no-op: its not. It preserves the ordering
        # source_ids had while only returning the members from source_ids
        # that we've decided we need.
        return [rev_id for rev_id in source_ids if rev_id in result_set]

    @classmethod
    def register_optimiser(klass, optimiser):
        """Register an InterRepository optimiser."""
        klass._optimisers.add(optimiser)

    def unlock(self):
        """Release the locks on source and target."""
        try:
            self.target.unlock()
        finally:
            self.source.unlock()

    @classmethod
    def unregister_optimiser(klass, optimiser):
        """Unregister an InterRepository optimiser."""
        klass._optimisers.remove(optimiser)

1175

1176

1177

class InterWeaveRepo(InterRepository):
    """Optimised code paths between Weave based repositories."""

    _matching_repo_format = _default_format
    """Repository format for testing with."""

    @staticmethod
    def is_compatible(source, target):
        """Be compatible with known Weave formats.

        We dont test for the stores being of specific types because that
        could lead to confusing results, and there is no need to be
        overly general.

        :return: True when both repositories use format 5, 6 or 7; False
            otherwise, including when either object has no _format.
        """
        try:
            return (isinstance(source._format, (RepositoryFormat5,
                                                RepositoryFormat6,
                                                RepositoryFormat7)) and
                    isinstance(target._format, (RepositoryFormat5,
                                                RepositoryFormat6,
                                                RepositoryFormat7)))
        except AttributeError:
            return False

    @needs_write_lock
    def copy_content(self, revision_id=None, basis=None):
        """See InterRepository.copy_content()."""
        # weave specific optimised path:
        if basis is not None:
            # copy the basis in, then fetch remaining data.
            basis.copy_content_into(self.target, revision_id)
            # the basis copy_content_into could misset this.
            try:
                self.target.set_make_working_trees(self.source.make_working_trees())
            except NotImplementedError:
                pass
            self.target.fetch(self.source, revision_id=revision_id)
        else:
            try:
                self.target.set_make_working_trees(self.source.make_working_trees())
            except NotImplementedError:
                pass
            # FIXME do not peek!
            if self.source.control_files._transport.listable():
                # Listable transport: copy the stores wholesale.
                pb = bzrlib.ui.ui_factory.progress_bar()
                copy_all(self.source.weave_store,
                    self.target.weave_store, pb=pb)
                pb.update('copying inventory', 0, 1)
                self.target.control_weaves.copy_multi(
                    self.source.control_weaves, ['inventory'])
                copy_all(self.source.revision_store,
                    self.target.revision_store, pb=pb)
            else:
                self.target.fetch(self.source, revision_id=revision_id)

    @needs_write_lock
    def fetch(self, revision_id=None, pb=None):
        """See InterRepository.fetch()."""
        from bzrlib.fetch import RepoFetcher
        mutter("Using fetch logic to copy between %s(%s) and %s(%s)",
               self.source, self.source._format, self.target, self.target._format)
        f = RepoFetcher(to_repository=self.target,
                        from_repository=self.source,
                        last_revision=revision_id,
                        pb=pb)
        return f.count_copied, f.failed_revisions

    @needs_read_lock
    def missing_revision_ids(self, revision_id=None):
        """See InterRepository.missing_revision_ids()."""
        # we want all revisions to satisfy revision_id in source.
        # but we dont want to stat every file here and there.
        # we want then, all revisions other needs to satisfy revision_id
        # checked, but not those that we have locally.
        # so the first thing is to get a subset of the revisions to
        # satisfy revision_id in source, and then eliminate those that
        # we do already have.
        # this is slow on high latency connection to self, but as this
        # disk format scales terribly for push anyway due to rewriting
        # inventory.weave, this is considered acceptable.
        # - RBC 20060209
        if revision_id is not None:
            source_ids = self.source.get_ancestry(revision_id)
            # The leading entry is expected to be None and must be dropped.
            # The pop is done outside the assert so that it still happens
            # when assertions are stripped (python -O).
            first = source_ids.pop(0)
            assert first is None
        else:
            source_ids = self.source._all_possible_ids()
        source_ids_set = set(source_ids)
        # source_ids is the worst possible case we may need to pull.
        # now we want to filter source_ids against what we actually
        # have in target, but dont try to check for existence where we know
        # we do not have a revision as that would be pointless.
        target_ids = set(self.target._all_possible_ids())
        possibly_present_revisions = target_ids.intersection(source_ids_set)
        actually_present_revisions = set(
            self.target._eliminate_revisions_not_present(
                possibly_present_revisions))
        required_revisions = source_ids_set.difference(
            actually_present_revisions)
        required_topo_revisions = [rev_id for rev_id in source_ids
                                   if rev_id in required_revisions]
        if revision_id is not None:
            # we used get_ancestry to determine source_ids then we are assured all
            # revisions referenced are present as they are installed in topological order.
            # and the tip revision was validated by get_ancestry.
            return required_topo_revisions
        else:
            # if we just grabbed the possibly available ids, then
            # we only have an estimate of whats available and need to validate
            # that against the revision records.
            return self.source._eliminate_revisions_not_present(
                required_topo_revisions)


InterRepository.register_optimiser(InterWeaveRepo)

1286

1287

1288

class RepositoryTestProviderAdapter(object):
    """Build a suite that runs one test against several repository formats.

    The test is copied once per (repository format, bzrdir format) pair.
    Each copy receives the transport_server, transport_readonly_server,
    bzrdir_format and repository_format attributes, and a new id() that
    names the repository format class so the copies can be told apart.
    """

    def __init__(self, transport_server, transport_readonly_server, formats):
        """Remember the servers and format pairs to inject.

        :param transport_server: Set on every copy as transport_server.
        :param transport_readonly_server: Set on every copy as
            transport_readonly_server.
        :param formats: Iterable of (repository_format, bzrdir_format) pairs.
        """
        self._formats = formats
        self._transport_readonly_server = transport_readonly_server
        self._transport_server = transport_server

    def _clone_for(self, test, repository_format, bzrdir_format):
        """Return a deep copy of test configured for one format pair."""
        clone = deepcopy(test)
        clone.transport_server = self._transport_server
        clone.transport_readonly_server = self._transport_readonly_server
        clone.bzrdir_format = bzrdir_format
        clone.repository_format = repository_format
        # The id is computed once, here; the replacement id() just returns it.
        scenario_id = "%s(%s)" % (clone.id(),
                                  repository_format.__class__.__name__)
        clone.id = lambda: scenario_id
        return clone

    def adapt(self, test):
        """Return a TestSuite holding one copy of test per format pair."""
        suite = TestSuite()
        for repository_format, bzrdir_format in self._formats:
            suite.addTest(
                self._clone_for(test, repository_format, bzrdir_format))
        return suite

1316

1317

1318

class InterRepositoryTestProviderAdapter(object):
    """Build a suite that runs one test against several interrepo providers.

    The test is copied once per (interrepo class, source format, target
    format) triple. Each copy receives the transport_server,
    transport_readonly_server, interrepo_class, repository_format and
    repository_format_to attributes, and a new id() that names the
    interrepo class so the copies can be told apart.
    """

    def __init__(self, transport_server, transport_readonly_server, formats):
        """Remember the servers and format triples to inject.

        :param transport_server: Set on every copy as transport_server.
        :param transport_readonly_server: Set on every copy as
            transport_readonly_server.
        :param formats: Iterable of (interrepo_class, repository_format,
            repository_format_to) triples.
        """
        self._formats = formats
        self._transport_readonly_server = transport_readonly_server
        self._transport_server = transport_server

    def _clone_for(self, test, interrepo_class, repository_format,
                   repository_format_to):
        """Return a deep copy of test configured for one triple."""
        clone = deepcopy(test)
        clone.transport_server = self._transport_server
        clone.transport_readonly_server = self._transport_readonly_server
        clone.interrepo_class = interrepo_class
        clone.repository_format = repository_format
        clone.repository_format_to = repository_format_to
        # The id is computed once, here; the replacement id() just returns it.
        scenario_id = "%s(%s)" % (clone.id(), interrepo_class.__name__)
        clone.id = lambda: scenario_id
        return clone

    def adapt(self, test):
        """Return a TestSuite holding one copy of test per triple."""
        suite = TestSuite()
        for interrepo_class, format_from, format_to in self._formats:
            suite.addTest(
                self._clone_for(test, interrepo_class, format_from, format_to))
        return suite

    @staticmethod
    def default_test_list():
        """Generate the default list of interrepo permutations to test."""
        # test the default InterRepository between format 6 and the knit
        # format.
        # XXX: robertc 20060220 reinstate this when there are two supported
        # formats which do not have an optimal code path between them.
        permutations = [(InterRepository,
                         RepositoryFormat6(),
                         RepositoryFormatKnit1())]
        # Every registered optimiser is exercised with its own matching
        # format on both sides.
        permutations.extend(
            (optimiser,
             optimiser._matching_repo_format,
             optimiser._matching_repo_format)
            for optimiser in InterRepository._optimisers)
        # if there are specific combinations we want to use, we can add them
        # here.
        return permutations

1367

1368

1369

class CopyConverter(object):
    """A repository conversion tool which just performs a copy of the content.

    This is slow but quite reliable.
    """

    def __init__(self, target_format):
        """Create a CopyConverter.

        :param target_format: The format the resulting repository should be.
        """
        self.target_format = target_format

    def convert(self, repo, pb):
        """Convert repo to the target format, giving feedback via pb.

        The existing 'repository' directory is moved to 'repository.backup',
        a new repository of the target format is initialized, the content of
        the backup is copied into it and the backup is then deleted.

        :param repo: The repository to convert.
        :param pb: a progress bar to use for progress information.
        """
        self.pb = pb
        self.count = 0
        self.total = 3
        # this is only useful with metadir layouts - separated repo content.
        # The call below fails for formats that have no format string.
        repo._format.get_format_string()
        self.repo_dir = repo.bzrdir

        self.step('Moving repository to repository.backup')
        self.repo_dir.transport.move('repository', 'repository.backup')
        backup = self.repo_dir.transport.clone('repository.backup')
        self.source_repo = repo._format.open(self.repo_dir,
                                             _found=True,
                                             _override_transport=backup)

        self.step('Creating new repository')
        is_shared = self.source_repo.is_shared()
        new_repo = self.target_format.initialize(self.repo_dir, is_shared)

        new_repo.lock_write()
        try:
            self.step('Copying content into repository.')
            self.source_repo.copy_content_into(new_repo)
        finally:
            new_repo.unlock()

        self.step('Deleting old repository content.')
        self.repo_dir.transport.delete_tree('repository.backup')
        self.pb.note('repository converted')

    def step(self, message):
        """Advance the step counter and report message on the pb."""
        self.count = self.count + 1
        self.pb.update(message, self.count, self.total)

Older »