/brz/remove-bazaar : revision 1239

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/fetch.py

Committer: Martin Pool
Date: 2005-09-13 23:08:19 UTC
Revision ID: mbp@sourcefrog.net-20050913230819-6ceae96050d32faa

ignore .bzr-shelf

files added:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

README

TODO

build-api

bzr-man.py

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/revision.py

bzrlib/selftest

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/teststore.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/ui.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/weavestore.py

bzrlib/workingtree.py

bzrlib/xml.py

bzrlib/xml5.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

setup.py

testbzr

testsweet.py

tools

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/history2weaves.py

tools/http_client.py

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/fetch.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

import sys

import os

from cStringIO import StringIO

import bzrlib.errors

from bzrlib.trace import mutter, note, warning

from bzrlib.branch import Branch, INVENTORY_FILEID, ANCESTRY_FILEID

from bzrlib.progress import ProgressBar

from bzrlib.xml5 import serializer_v5

from bzrlib.osutils import sha_string, split_lines

"""Copying of history from one branch to another.

The basic plan is that every branch knows the history of everything

that has merged into it. As the first step of a merge, pull, or

branch operation we copy history from the source into the destination

branch.

The copying is done in a slightly complicated order. We don't want to

add a revision to the store until everything it refers to is also

stored, so that if a revision is present we can totally recreate it.

However, we can't know what files are included in a revision until we

read its inventory. Therefore, we first pull the XML and hold it in

memory until we've updated all of the files referenced.

"""

# TODO: Avoid opening the same weaves over and over again.

# XXX: This doesn't handle ghost (not present in branch) revisions at

# all yet.

# - get a list of revisions that need to be pulled in

# - for each one, pull in that revision file

# and get the inventory, and store the inventory with right

# parents.

# - and get the ancestry, and store that with right parents too

# - and keep a note of all file ids and versions seen

# - then go through all files; for each one get the weave,

# and add in all file versions

def greedy_fetch(to_branch, from_branch, revision, pb):
    """Fetch history from from_branch into to_branch.

    A Fetcher is built with `revision` as its revision limit and `pb` as
    its progress bar; constructing it performs the fetch.

    Returns a (count_copied, failed_revisions) tuple read from the Fetcher.
    """
    fetcher = Fetcher(to_branch, from_branch, revision, pb)
    result = (fetcher.count_copied, fetcher.failed_revisions)
    return result

class Fetcher(object):
    """Pull history from one branch to another.

    Constructing a Fetcher performs the whole fetch: it loads the revision
    histories of both branches, works out which revisions of the source
    ancestry are not in the destination ancestry, and copies them.

    revision_limit
        If set, pull only up to this revision_id.

    Attributes set by the constructor:

    count_copied
        Number of revisions copied into to_branch.

    failed_revisions
        Initialised to an empty list; nothing in this class appends to it.
    """

    def __init__(self, to_branch, from_branch, revision_limit=None, pb=None):
        self.to_branch = to_branch
        self.from_branch = from_branch
        self.revision_limit = revision_limit
        self.failed_revisions = []
        self.count_copied = 0
        if pb is None:
            # The module only imports bzrlib.errors at the top, so make sure
            # the ui submodule is actually loaded before touching it.
            import bzrlib.ui
            self.pb = bzrlib.ui.ui_factory.progress_bar()
        else:
            self.pb = pb
        self._load_histories()
        revs_to_fetch = self._compare_ancestries()
        self._copy_revisions(revs_to_fetch)

    def _load_histories(self):
        """Load histories of both branches, up to the limit.

        Sets self.from_history and self.to_history.  When a revision limit
        is set and found in the source history, the source history is
        truncated just after it; when it is not found there, the source
        history becomes a one-element list holding only the limit.
        """
        self.from_history = self.from_branch.revision_history()
        self.to_history = self.to_branch.revision_history()
        limit = self.revision_limit
        if limit:
            assert isinstance(limit, basestring)
            try:
                rev_index = self.from_history.index(limit)
            except ValueError:
                rev_index = None
            if rev_index is not None:
                self.from_history = self.from_history[:rev_index + 1]
            else:
                self.from_history = [limit]

    def _compare_ancestries(self):
        """Get a list of revisions that must be copied.

        That is, every revision that's in the ancestry of the source
        branch and not in the destination branch.

        Returns the missing revision ids in the order they appear in the
        source ancestry.
        """
        if self.from_history:
            self.from_ancestry = self.from_branch.get_ancestry(
                self.from_history[-1])
        else:
            self.from_ancestry = []
        # NOTE(review): this replaces to_history (the revision history) with
        # the destination *ancestry*; a separate to_ancestry attribute was
        # probably intended.  Kept as-is so the attribute callers may read
        # does not change meaning.
        if self.to_history:
            self.to_history = self.to_branch.get_ancestry(self.to_history[-1])
        else:
            self.to_history = []
        already_present = set(self.to_history)
        to_fetch = []
        for rev_id in self.from_ancestry:
            if rev_id not in already_present:
                to_fetch.append(rev_id)
                mutter('need to get revision {%s}', rev_id)
        mutter('need to get %d revisions in total', len(to_fetch))
        return to_fetch

    def _copy_revisions(self, revs_to_fetch):
        """Copy each listed revision in order, counting the copies made."""
        for rev_id in revs_to_fetch:
            self._copy_one_revision(rev_id)
            # Only count a revision once it has been copied without raising.
            self.count_copied += 1

    def _copy_one_revision(self, rev_id):
        """Copy revision and everything referenced by it.

        The file texts are copied first, then the inventory, and the
        revision itself is added to the revision store last.
        """
        mutter('copying revision {%s}', rev_id)
        rev_xml = self.from_branch.get_revision_xml(rev_id)
        inv_xml = self.from_branch.get_inventory_xml(rev_id)
        rev = serializer_v5.read_revision_from_string(rev_xml)
        inv = serializer_v5.read_inventory_from_string(inv_xml)
        # Sanity checks: the revision must be the one asked for and the
        # inventory must match the hash recorded in the revision.
        assert rev.revision_id == rev_id
        assert rev.inventory_sha1 == sha_string(inv_xml)
        mutter('  commiter %s, %d parents',
               rev.committer,
               len(rev.parents))
        self._copy_new_texts(rev_id, inv)
        self.to_branch.weave_store.add_text(INVENTORY_FILEID, rev_id,
                                            split_lines(inv_xml), rev.parents)
        self.to_branch.revision_store.add(StringIO(rev_xml), rev_id)

    def _copy_new_texts(self, rev_id, inv):
        """Copy any new texts occurring in this revision.

        Only inventory entries of kind 'file' whose text_version equals
        rev_id are copied.
        """
        # TODO: Rather than writing out weaves every time, hold them
        # in memory until everything's done?  But this way is nicer
        # if it's interrupted.
        for path, ie in inv.iter_entries():
            if ie.kind != 'file':
                continue
            if ie.text_version != rev_id:
                continue
            mutter('%s {%s} is changed in this revision',
                   path, ie.file_id)
            self._copy_one_text(rev_id, ie.file_id)

    def _copy_one_text(self, rev_id, file_id):
        """Copy one file text.

        Reads version rev_id of file_id from the source weave and adds it
        to the destination weave, translating the parent versions by name.
        """
        from_weave = self.from_branch.weave_store.get_weave(file_id)
        from_idx = from_weave.lookup(rev_id)
        from_parents = [from_weave.idx_to_name(parent_idx)
                        for parent_idx in from_weave.parents(from_idx)]
        text_lines = from_weave.get(from_idx)
        to_weave = self.to_branch.weave_store.get_weave_or_empty(file_id)
        to_parents = [to_weave.lookup(parent_name)
                      for parent_name in from_parents]
        # it's ok to add even if the text is already there
        to_weave.add(rev_id, to_parents, text_lines)
        self.to_branch.weave_store.put_weave(file_id, to_weave)

Older »