/brz/remove-bazaar : revision 1596.2.35

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/fetch.py

Committer: Robert Collins
Date: 2006-03-12 17:09:11 UTC
mto: (1615.1.2 bzr.mbp.integration)
mto: This revision was merged to the branch mainline in revision 1616.
Revision ID: robertc@robertcollins.net-20060312170911-306a47e0478ec183

Subclass SequenceMatcher to get a slightly faster (in our case) find_longest_match routine.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py.moved

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

generate_docs.py

notes

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/fetch.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Copying of history from one branch to another.

The basic plan is that every branch knows the history of everything

that has merged into it. As the first step of a merge, pull, or

branch operation we copy history from the source into the destination

branch.

The copying is done in a slightly complicated order. We don't want to

add a revision to the store until everything it refers to is also

stored, so that if a revision is present we can totally recreate it.

However, we can't know what files are included in a revision until we

read its inventory. So we query the inventory store of the source for

the ids we need, and then pull those ids and finally actually join

the inventories.

"""

import bzrlib

import bzrlib.errors as errors

from bzrlib.errors import (InstallFailed, NoSuchRevision,

MissingText)

from bzrlib.trace import mutter

from bzrlib.reconcile import RepoReconciler

from bzrlib.revision import NULL_REVISION

from bzrlib.symbol_versioning import *

# TODO: Avoid opening the same weaves repeatedly.

# XXX: This doesn't handle ghost (not present in branch) revisions at

# all yet. I'm not sure they really should be supported.

# NOTE: This doesn't copy revisions which may be present but not

# merged into the last revision. I'm not sure we want to do that.

# - get a list of revisions that need to be pulled in

# - for each one, pull in that revision file

# and get the inventory, and store the inventory with right

# parents.

# - and get the ancestry, and store that with right parents too

# - and keep a note of all file ids and version seen

# - then go through all files; for each one get the weave,

# and add in all file versions

@deprecated_function(zero_eight)
def greedy_fetch(to_branch, from_branch, revision=None, pb=None):
    """Legacy API, please see branch.fetch(from_branch, last_revision, pb).

    Constructs a Fetcher for the two branches (which performs the fetch as
    a side effect of construction) and reports its result counters.

    to_branch -- branch that receives the history.
    from_branch -- branch the history is copied from.
    revision -- optional revision id passed through as the fetch limit.
    pb -- optional progress bar passed through to the fetch.

    Returns a (count_copied, failed_revisions) tuple.
    """
    f = Fetcher(to_branch, from_branch, revision, pb)
    # Fetcher's constructor just delegates to to_branch.fetch() and may not
    # expose the legacy result attributes.  Fall back to "nothing copied,
    # nothing failed" instead of raising AttributeError once the fetch has
    # already been carried out.
    return getattr(f, 'count_copied', 0), getattr(f, 'failed_revisions', [])


# Module-level alias for greedy_fetch.
fetch = greedy_fetch

class RepoFetcher(object):
    """Pull revisions and texts from one repository to another.

    last_revision
        if set, try to limit to the data this revision references.

    after running:
    count_copied -- number of revisions copied
    failed_revisions -- initialised to an empty list; nothing in this class
        appends to it.

    This should not be used directly; it is essentially an object that
    encapsulates the logic in InterRepository.fetch().

    Subclasses must provide _fetch_revision_texts(revs): it is called by the
    worker function but not defined on this class.
    """

    def __init__(self, to_repository, from_repository, last_revision=None,
                 pb=None):
        """Run the fetch; all the work happens during construction.

        to_repository -- repository that receives the data (write locked
            for the duration of the fetch).
        from_repository -- repository the data is read from (read locked
            for the duration of the fetch).
        last_revision -- optional revision id limiting what is fetched.
        pb -- optional progress bar; when None a nested progress bar is
            obtained from bzrlib.ui.ui_factory and finished before returning.
        """
        # result variables.
        self.failed_revisions = []
        self.count_copied = 0
        to_base = to_repository.control_files._transport.base
        from_base = from_repository.control_files._transport.base
        if to_base == from_base:
            # Same location: check that last_revision is in 'from' and then
            # return as a no-operation.
            if last_revision not in (None, NULL_REVISION):
                from_repository.get_revision(last_revision)
            return
        self.to_repository = to_repository
        self.from_repository = from_repository
        # must not mutate self._last_revision as it is potentially a shared
        # instance
        self._last_revision = last_revision
        if pb is None:
            self.pb = bzrlib.ui.ui_factory.nested_progress_bar()
            self.nested_pb = self.pb
        else:
            self.pb = pb
            self.nested_pb = None
        # The progress bar we created is released in the outermost finally
        # so that it is not leaked when acquiring either lock fails.
        try:
            self.from_repository.lock_read()
            try:
                self.to_repository.lock_write()
                try:
                    self.__fetch()
                finally:
                    self.to_repository.unlock()
            finally:
                self.from_repository.unlock()
        finally:
            if self.nested_pb is not None:
                self.nested_pb.finished()

    def __fetch(self):
        """Primary worker function.

        This initialises all the needed variables, and then fetches the
        requested revisions, finally clearing the progress bar.
        """
        self.to_weaves = self.to_repository.weave_store
        self.to_control = self.to_repository.control_weaves
        self.from_weaves = self.from_repository.weave_store
        self.from_control = self.from_repository.control_weaves
        self.count_total = 0
        self.file_ids_names = {}
        self.total_steps = 4
        try:
            revs = self._revids_to_fetch()
            # something to do ?
            if revs:
                # Texts first, then inventories, then revisions.
                self.pb.update('Fetching text', 1, self.total_steps)
                self._fetch_weave_texts(revs)
                self.pb.update('Fetching inventories', 2, self.total_steps)
                self._fetch_inventory_weave(revs)
                self.pb.update('Fetching revisions', 3, self.total_steps)
                self._fetch_revision_texts(revs)
                self.pb.update('Fetching revisions', 4, self.total_steps)
                self.count_copied += len(revs)
        finally:
            self.pb.clear()

    def _revids_to_fetch(self):
        """Work out which revision ids have to be copied.

        Returns None when there is nothing to fetch: either the limit is
        NULL_REVISION or the target already has the limiting revision.
        Otherwise returns whatever
        to_repository.missing_revision_ids(from_repository, last_revision)
        reports.

        Raises InstallFailed (carrying the limiting revision id) when that
        lookup raises NoSuchRevision.
        """
        self.pb.update('Calculating needed data', 0, self.total_steps)
        mutter('fetch up to rev {%s}', self._last_revision)
        # Compare by value, matching the check in __init__; an identity test
        # would miss an equal revision id held in a different string object.
        if self._last_revision == NULL_REVISION:
            # explicit limit of no revisions needed
            return None
        if (self._last_revision is not None and
            self.to_repository.has_revision(self._last_revision)):
            return None

        try:
            return self.to_repository.missing_revision_ids(
                self.from_repository, self._last_revision)
        except errors.NoSuchRevision:
            raise InstallFailed([self._last_revision])

    def _fetch_weave_texts(self, revs):
        """Copy the file texts involved in revs into the target weave store.

        The file ids come from from_repository.fileid_involved_by_set(revs).
        A weave missing from the target is copied wholesale; an existing one
        is joined with the source weave.
        """
        texts_pb = bzrlib.ui.ui_factory.nested_progress_bar()
        try:
            file_ids = self.from_repository.fileid_involved_by_set(revs)
            num_file_ids = len(file_ids)
            for count, file_id in enumerate(file_ids):
                texts_pb.update("fetch texts", count, num_file_ids)
                try:
                    to_weave = self.to_weaves.get_weave(file_id,
                        self.to_repository.get_transaction())
                except errors.NoSuchFile:
                    # destination is empty, just copy it.
                    # this copies all the texts, which is useful and
                    # on per-file basis quite cheap.
                    self.to_weaves.copy_multi(
                        self.from_weaves,
                        [file_id],
                        None,
                        self.from_repository.get_transaction(),
                        self.to_repository.get_transaction())
                else:
                    # destination has contents, must merge
                    from_weave = self.from_weaves.get_weave(file_id,
                        self.from_repository.get_transaction())
                    # we fetch all the texts, because texts do
                    # not reference anything, and its cheap enough
                    to_weave.join(from_weave)
        finally:
            texts_pb.finished()

    def _fetch_inventory_weave(self, revs):
        """Join the source inventory weave into the target, limited to revs.

        Progress for the sub-steps is reported on a nested progress bar
        owned by this method, leaving the overall step counter on self.pb
        untouched.
        """
        inv_pb = bzrlib.ui.ui_factory.nested_progress_bar()
        try:
            inv_pb.update("fetch inventory", 0, 2)
            to_weave = self.to_control.get_weave('inventory',
                    self.to_repository.get_transaction())

            # just merge, this is optimisable and it means we dont
            # copy unreferenced data such as not-needed inventories.
            inv_pb.update("fetch inventory", 1, 2)
            from_weave = self.from_repository.get_inventory_weave()
            inv_pb.update("fetch inventory", 2, 2)
            # we fetch only the referenced inventories because we do not
            # know for unselected inventories whether all their required
            # texts are present in the other repository - it could be
            # corrupt.
            to_weave.join(from_weave, msg='fetch inventory', version_ids=revs)
        finally:
            inv_pb.finished()

209

210

211

class GenericRepoFetcher(RepoFetcher):
    """Repository-to-repository fetcher that assumes little about layout.

    Revisions (and their signatures, where present) are copied one at a
    time through the target's revision store, and the target repository is
    reconciled once the copy is complete.
    """

    def _fetch_revision_texts(self, revs):
        """Copy each revision in revs, then reconcile the target."""
        rev_pb = bzrlib.ui.ui_factory.nested_progress_bar()
        try:
            self.to_transaction = self.to_repository.get_transaction()
            total = len(revs)
            copied = 0
            for revision_id in revs:
                rev_pb.update('fetch revisions', copied, total)
                try:
                    signature = self.from_repository.get_signature_text(
                        revision_id)
                    self.to_repository._revision_store.add_revision_signature_text(
                        revision_id, signature, self.to_transaction)
                except errors.NoSuchRevision:
                    # The revision carries no signature; nothing to copy.
                    pass
                revision = self.from_repository.get_revision(revision_id)
                self.to_repository._revision_store.add_revision(
                    revision, self.to_transaction)
                copied += 1
            # NOTE(review): the original indentation was lost in this view;
            # this update is taken to run once, after the loop - confirm.
            rev_pb.update('copying revisions', copied, total)
            # Fix up the inventory if needed.  This is expensive because
            # there is no inverse index to the current ghosts, but on local
            # disk it is a few seconds and sftp push is already insane, so
            # it is simply always done.
            # FIXME: repository should inform if this is needed.
            self.to_repository.reconcile()
        finally:
            rev_pb.finished()

246

247

248

class KnitRepoFetcher(RepoFetcher):
    """Fetcher specific to knit format repositories.

    Unlike GenericRepoFetcher it performs no reconciliation after copying,
    and it copies signatures and revision texts by joining the source
    files into the target files.
    """

    def _fetch_revision_texts(self, revs):
        """Join the signature and revision files for revs into the target."""
        # may need to be a InterRevisionStore call here.
        source_txn = self.from_repository.get_transaction()
        target_txn = self.to_repository.get_transaction()

        # Signatures first; revisions without one are tolerated.
        target_signatures = \
            self.to_repository._revision_store.get_signature_file(target_txn)
        source_signatures = \
            self.from_repository._revision_store.get_signature_file(source_txn)
        target_signatures.join(source_signatures, version_ids=revs,
                               ignore_missing=True)

        # Then the revision texts themselves.
        target_revisions = \
            self.to_repository._revision_store.get_revision_file(target_txn)
        source_revisions = \
            self.from_repository._revision_store.get_revision_file(source_txn)
        target_revisions.join(source_revisions, version_ids=revs)

270

271

272

class Fetcher(object):
    """Backwards compatibility glue for branch.fetch().

    Constructing an instance performs the fetch by delegating to
    to_branch.fetch().

    after running:
    count_copied -- number of revisions copied (0 when unknown)
    failed_revisions -- revisions that failed (empty list when unknown)
    """

    @deprecated_method(zero_eight)
    def __init__(self, to_branch, from_branch, last_revision=None, pb=None):
        """Please see branch.fetch()."""
        # greedy_fetch() in this module reads these attributes back, so make
        # sure they always exist.
        self.count_copied = 0
        self.failed_revisions = []
        result = to_branch.fetch(from_branch, last_revision, pb)
        # NOTE(review): assumes branch.fetch() reports its outcome as a
        # (count_copied, failed_revisions) pair - confirm against
        # Branch.fetch.  Any other return value leaves the defaults in place.
        if isinstance(result, tuple) and len(result) == 2:
            self.count_copied, self.failed_revisions = result

Older »