/brz/remove-bazaar : revision 1390

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/fetch.py

Committer: Robert Collins
Date: 2005-09-27 07:24:40 UTC
mfrom: (1185.1.41)
Revision ID: robertc@robertcollins.net-20050927072440-1bf4d99c3e1db5b3

pair programming worx... merge integration and weave

files added:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr-man.py

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/selftest

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_revision_info.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testgraph.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testremotebranch.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/teststore.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/ui.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/weavestore.py

bzrlib/workingtree.py

bzrlib/xml.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/symlink-support.patch

setup.py

testbzr

testsweet.py

tools

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/fetch.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

import os

from cStringIO import StringIO

import bzrlib.errors

from bzrlib.trace import mutter, note, warning

from bzrlib.branch import Branch

from bzrlib.progress import ProgressBar

from bzrlib.xml5 import serializer_v5

from bzrlib.osutils import sha_string, split_lines

from bzrlib.errors import NoSuchRevision

"""Copying of history from one branch to another.

The basic plan is that every branch knows the history of everything

that has merged into it. As the first step of a merge, pull, or

branch operation we copy history from the source into the destination

branch.

The copying is done in a slightly complicated order. We don't want to

add a revision to the store until everything it refers to is also

stored, so that if a revision is present we can totally recreate it.

However, we can't know what files are included in a revision until we

read its inventory. Therefore, we first pull the XML and hold it in

memory until we've updated all of the files referenced.

"""

# TODO: Avoid repeatedly opening weaves so many times.

# XXX: This doesn't handle ghost (not present in branch) revisions at

# all yet. I'm not sure they really should be supported.

# NOTE: This doesn't copy revisions which may be present but not

# merged into the last revision. I'm not sure we want to do that.

# - get a list of revisions that need to be pulled in
# - for each one, pull in that revision file
#   and get the inventory, and store the inventory with the right
#   parents.
# - and get the ancestry, and store that with the right parents too
# - and keep a note of all file ids and versions seen
# - then go through all files; for each one get the weave,
#   and add in all file versions

def greedy_fetch(to_branch, from_branch, revision=None, pb=None):
    """Copy missing history from from_branch into to_branch.

    Builds a Fetcher (whose constructor does the copying), passing
    ``revision`` as the limiting revision and ``pb`` as the progress bar.

    Returns a tuple (count_copied, failed_revisions) taken from the
    Fetcher after it has run.
    """
    fetcher = Fetcher(to_branch, from_branch, last_revision=revision, pb=pb)
    return (fetcher.count_copied, fetcher.failed_revisions)

class Fetcher(object):
    """Pull revisions and texts from one branch to another.

    This doesn't update the destination's history; that can be done
    separately if desired.

    All of the work is done by the constructor: creating a Fetcher
    performs the copy.

    last_revision
        If set, pull only up to this revision_id.  It must be present
        in the revision history of from_branch.

    After running:

    last_revision -- the limiting revision: the one passed in if given,
        otherwise the last revision of from_branch (None if from_branch
        has no history)

    count_total -- number of revisions in the source ancestry that
        were not in the destination ancestry

    count_copied -- number of revisions copied

    count_texts -- number of file texts copied

    failed_revisions -- starts as an empty list; nothing in this class
        adds to it

    new_ancestry -- the list of revision ids selected for copying
    """

    def __init__(self, to_branch, from_branch, last_revision=None, pb=None):
        self.to_branch = to_branch
        self.to_weaves = to_branch.weave_store
        self.to_control = to_branch.control_weaves
        self.from_branch = from_branch
        self.from_weaves = from_branch.weave_store
        self.from_control = from_branch.control_weaves
        self.failed_revisions = []
        self.count_copied = 0
        self.count_total = 0
        self.count_texts = 0
        if pb is None:
            # Imported here because the module only imports bzrlib.errors
            # at the top, so bzrlib.ui is not guaranteed to be loaded.
            import bzrlib.ui
            self.pb = bzrlib.ui.ui_factory.progress_bar()
        else:
            self.pb = pb
        self.last_revision = self._find_last_revision(last_revision)
        mutter('fetch up to rev {%s}', self.last_revision)
        revs_to_fetch = self._compare_ancestries()
        self._copy_revisions(revs_to_fetch)
        self.new_ancestry = revs_to_fetch

    def _find_last_revision(self, last_revision):
        """Find the limiting source revision.

        Every ancestor of that revision will be merged across.

        Returns the revision_id, or returns None if there's no history
        in the source branch.

        Raises NoSuchRevision if last_revision is given but is not in
        the revision history of the source branch.
        """
        self.pb.update('get source history')
        from_history = self.from_branch.revision_history()
        # NOTE: no destination history is read here; the message is kept
        # so that the progress output stays the same.
        self.pb.update('get destination history')
        if last_revision:
            if last_revision not in from_history:
                raise NoSuchRevision(self.from_branch, last_revision)
            return last_revision
        if from_history:
            return from_history[-1]
        return None     # no history in the source branch

    def _compare_ancestries(self):
        """Get a list of revisions that must be copied.

        That is, every revision that's in the ancestry of the source
        branch and not in the destination branch.  The order of the
        source ancestry is preserved.  Also records the source ancestry
        in self.from_ancestry and the number of revisions to copy in
        self.count_total.
        """
        self.pb.update('get source ancestry')
        self.from_ancestry = self.from_branch.get_ancestry(self.last_revision)

        dest_last_rev = self.to_branch.last_revision()
        self.pb.update('get destination ancestry')
        if dest_last_rev:
            dest_ancestry = self.to_branch.get_ancestry(dest_last_rev)
        else:
            dest_ancestry = []
        # A set gives constant-time membership tests in the loop below.
        already_present = set(dest_ancestry)
        to_fetch = []
        for rev_id in self.from_ancestry:
            if rev_id not in already_present:
                to_fetch.append(rev_id)
                mutter('need to get revision {%s}', rev_id)
        mutter('need to get %d revisions in total', len(to_fetch))
        self.count_total = len(to_fetch)
        return to_fetch

    def _copy_revisions(self, revs_to_fetch):
        """Copy each listed revision that the destination lacks.

        None entries and revisions the destination already has are
        skipped.  The progress position counts every entry of the list,
        including skipped ones.
        """
        for index, rev_id in enumerate(revs_to_fetch):
            if rev_id is None:
                continue
            if self.to_branch.has_revision(rev_id):
                continue
            self.pb.update('fetch revision', index + 1, self.count_total)
            self._copy_one_revision(rev_id)
            self.count_copied += 1

    def _copy_one_revision(self, rev_id):
        """Copy revision and everything referenced by it.

        The revision XML is added to the destination's revision store
        last, after the texts, inventory and ancestry it refers to.

        Raises AssertionError if the revision read back does not carry
        the requested id, or if its recorded inventory sha1 does not
        match the inventory XML that was read.
        """
        mutter('copying revision {%s}', rev_id)
        rev_xml = self.from_branch.get_revision_xml(rev_id)
        inv_xml = self.from_branch.get_inventory_xml(rev_id)
        rev = serializer_v5.read_revision_from_string(rev_xml)
        inv = serializer_v5.read_inventory_from_string(inv_xml)
        # Explicit raises rather than assert statements, so that these
        # integrity checks still run under "python -O".
        if rev.revision_id != rev_id:
            raise AssertionError(
                'revision {%s} was read when {%s} was requested'
                % (rev.revision_id, rev_id))
        if rev.inventory_sha1 != sha_string(inv_xml):
            raise AssertionError(
                'inventory sha1 mismatch for revision {%s}' % (rev_id,))
        mutter('  commiter %s, %d parents',
               rev.committer,
               len(rev.parent_ids))
        self._copy_new_texts(rev_id, inv)
        self._copy_inventory(rev_id, inv_xml, rev.parent_ids)
        self._copy_ancestry(rev_id, rev.parent_ids)
        self.to_branch.revision_store.add(StringIO(rev_xml), rev_id)

    def _copy_inventory(self, rev_id, inv_xml, parent_ids):
        """Add the inventory XML as version rev_id of the 'inventory' weave."""
        self.to_control.add_text('inventory', rev_id,
                                 split_lines(inv_xml), parent_ids)

    def _copy_ancestry(self, rev_id, parent_ids):
        """Copy version rev_id of the 'ancestry' weave from the source."""
        ancestry_lines = self.from_control.get_lines('ancestry', rev_id)
        self.to_control.add_text('ancestry', rev_id, ancestry_lines,
                                 parent_ids)

    def _copy_new_texts(self, rev_id, inv):
        """Copy any new texts occurring in this revision.

        Only inventory entries of kind 'file' whose text_version is
        rev_id are copied.
        """
        # TODO: Rather than writing out weaves every time, hold them
        # in memory until everything's done?  But this way is nicer
        # if it's interrupted.
        for path, ie in inv.iter_entries():
            if ie.kind != 'file':
                continue
            if ie.text_version != rev_id:
                continue
            mutter('%s {%s} is changed in this revision',
                   path, ie.file_id)
            self._copy_one_text(rev_id, ie.file_id)

    def _copy_one_text(self, rev_id, file_id):
        """Copy one file text."""
        mutter('copy text version {%s} of file {%s}',
               rev_id, file_id)
        from_weave = self.from_weaves.get_weave(file_id)
        from_idx = from_weave.lookup(rev_id)
        # Parents are translated index -> name in the source weave, then
        # name -> index in the destination weave.
        from_parents = [from_weave.idx_to_name(parent_idx)
                        for parent_idx in from_weave.parents(from_idx)]
        text_lines = from_weave.get(from_idx)
        to_weave = self.to_weaves.get_weave_or_empty(file_id)
        to_parents = [to_weave.lookup(parent_name)
                      for parent_name in from_parents]
        # it's ok to add even if the text is already there
        to_weave.add(rev_id, to_parents, text_lines)
        self.to_weaves.put_weave(file_id, to_weave)
        self.count_texts += 1

228

229

230

# Alias: calling fetch(...) constructs a Fetcher, and the Fetcher
# constructor performs the copy.
fetch = Fetcher

Older »