/brz/remove-bazaar : revision 1907.1.3

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/inventory.py

Committer: Aaron Bentley
Date: 2006-08-06 18:59:06 UTC
mto: (1731.1.34 nested-trees)
mto: This revision was merged to the branch mainline in revision 1910.
Revision ID: aaron.bentley@utoronto.ca-20060806185906-8c033dc32180fb00

Fixed unicode test cases

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

HACKING

INSTALL

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revprops.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/README.1st

doc/configuration.txt

doc/default.css

doc/index.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

generate_docs.py

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/ostools.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/inventory.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# FIXME: This refactoring of the workingtree code doesn't seem to keep

# the WorkingTree's copy of the inventory in sync with the branch. The

# branch modifies its working inventory when it does a commit to make

# missing files permanently removed.

# TODO: Maybe also keep the full path of the entry, and the children?

# But those depend on its position within a particular inventory, and

# it would be nice not to need to hold the backpointer here.

# This should really be an id randomly assigned when the tree is

# created, but it's not for now.

ROOT_ID = "TREE_ROOT"

import collections

import os.path

import re

import sys

import tarfile

import types

import bzrlib

from bzrlib import errors, osutils

from bzrlib.osutils import (pumpfile, quotefn, splitpath, joinpath,

pathjoin, sha_strings)

from bzrlib.errors import (NotVersionedError, InvalidEntryName,

BzrError, BzrCheckError, BinaryFile)

from bzrlib.trace import mutter

class InventoryEntry(object):

"""Description of a versioned file.

An InventoryEntry has the following fields, which are also

present in the XML inventory-entry element:

file_id

name

(within the parent directory)

parent_id

file_id of the parent directory, or ROOT_ID

revision

the revision_id in which this variation of this file was

introduced.

executable

Indicates that this file should be executable on systems

that support it.

text_sha1

sha-1 of the text of the file

text_size

size in bytes of the text of the file

(reading a version 4 tree created a text_id field.)

>>> i = Inventory()

>>> i.path2id('')

'TREE_ROOT'

>>> i.add(InventoryDirectory('123', 'src', ROOT_ID))

InventoryDirectory('123', 'src', parent_id='TREE_ROOT', revision=None)

>>> i.add(InventoryFile('2323', 'hello.c', parent_id='123'))

InventoryFile('2323', 'hello.c', parent_id='123', sha1=None, len=None)

>>> shouldbe = {0: '', 1: 'src', 2: pathjoin('src','hello.c')}

>>> for ix, j in enumerate(i.iter_entries()):

... print (j[0] == shouldbe[ix], j[1])

...

(True, InventoryDirectory('TREE_ROOT', '', parent_id=None, revision=None))

(True, InventoryDirectory('123', 'src', parent_id='TREE_ROOT', revision=None))

(True, InventoryFile('2323', 'hello.c', parent_id='123', sha1=None, len=None))

>>> i.add(InventoryFile('2323', 'bye.c', '123'))

Traceback (most recent call last):

...

BzrError: inventory already contains entry with id {2323}

>>> i.add(InventoryFile('2324', 'bye.c', '123'))

InventoryFile('2324', 'bye.c', parent_id='123', sha1=None, len=None)

>>> i.add(InventoryDirectory('2325', 'wibble', '123'))

InventoryDirectory('2325', 'wibble', parent_id='123', revision=None)

>>> i.path2id('src/wibble')

100

'2325'

101

>>> '2325' in i

102

True

103

>>> i.add(InventoryFile('2326', 'wibble.c', '2325'))

104

InventoryFile('2326', 'wibble.c', parent_id='2325', sha1=None, len=None)

105

>>> i['2326']

106

InventoryFile('2326', 'wibble.c', parent_id='2325', sha1=None, len=None)

107

>>> for path, entry in i.iter_entries():

108

... print path

109

... assert i.path2id(path)

110

...

111

112

src

113

src/bye.c

114

src/hello.c

115

src/wibble

116

src/wibble/wibble.c

117

>>> i.id2path('2326')

118

'src/wibble/wibble.c'

119

"""

120

121

# Constants returned by describe_change()

122

123

# TODO: These should probably move to some kind of FileChangeDescription

124

# class; that's like what's inside a TreeDelta but we want to be able to

125

# generate them just for one file at a time.

126

RENAMED = 'renamed'

127

MODIFIED_AND_RENAMED = 'modified and renamed'

128

129

__slots__ = []

130

131

def detect_changes(self, old_entry):
    """Report whether text and metadata differ between self and old_entry.

    _read_tree_state must already have been called on both self and
    old_entry before this method is used.

    :param old_entry: the entry to compare against.
    :return: a (text_modified, meta_modified) tuple. This base
        implementation always answers (False, False).
    """
    text_modified = False
    meta_modified = False
    return (text_modified, meta_modified)

138

139

def diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,
         output_to, reverse=False):
    """Diff this entry against to_entry by delegating to _diff.

    This is a template method: it refreshes the tree state of self (and of
    to_entry, when one is given) and then forwards every argument unchanged
    to self._diff, which child classes override.

    :param text_diff: used for textual difference calculation.
    :param tree: tree that self is read from.
    :param to_entry: entry to compare against; may be false/None.
    :param to_tree: tree that to_entry is read from.
    """
    own_path = tree.id2path(self.file_id)
    self._read_tree_state(own_path, tree)
    if to_entry:
        # Entries of different kinds cannot be diffed against each other;
        # a kind change has to be expressed as a removal plus an add.
        assert self.kind == to_entry.kind
        other_path = to_tree.id2path(to_entry.file_id)
        to_entry._read_tree_state(other_path, to_tree)
    self._diff(text_diff, from_label, tree, to_label, to_entry, to_tree,
               output_to, reverse)

155

156

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

157

output_to, reverse=False):

158

"""Perform a diff between two entries of the same kind."""

159

160

def find_previous_heads(self, previous_inventories,
                        versioned_file_store,
                        transaction,
                        entry_vf=None):
    """Find the per-file heads among the parent inventories.

    The result maps revision id -> inventory entry. It holds the file
    revisions, taken from every parent inventory that contains this file
    id, that are not an ancestor of any other such revision. A file that
    appears in none of the parents yields an empty map.

    :param previous_inventories: the parent inventories to inspect.
    :param versioned_file_store: A store where ancestry data on this
                                 file id can be queried.
    :param transaction: The transaction that queries to the versioned
                        file store should be completed under.
    :param entry_vf: The entry versioned file, if it is already available.
    """
    # revision -> entry for each entry with our file id in the parents.
    candidates = {}
    for parent_inv in previous_inventories:
        if self.file_id not in parent_inv:
            continue
        ie = parent_inv[self.file_id]
        assert ie.file_id == self.file_id
        if ie.revision not in candidates:
            # first sighting of this revision: record it as a candidate.
            candidates[ie.revision] = ie
            continue
        # The same revision value was found in two different inventories.
        # Correct a possible inconsistency first: there was a bug in
        # revision updates with 'x' bit support.
        known = candidates[ie.revision]
        try:
            if known.executable != ie.executable:
                known.executable = False
                ie.executable = False
        except AttributeError:
            pass
        # after the correction the two entries must agree.
        assert known == ie

    # revision -> entry, one per head.
    heads = {}
    if len(candidates) == 1:
        # Common case: with a single candidate revision we can avoid
        # opening the versioned file to access ancestry, since there is
        # nothing that could be eliminated. 'ie' is the entry seen last
        # in the loop above, which carries that single revision.
        heads[ie.revision] = ie
        return heads

    # Eliminate ancestors amongst the candidates: a head is a candidate
    # that is not an ancestor of any other candidate. This provides
    # convergence at a per-file level.
    head_ancestors = {}    # head revision -> set of its ancestors
    for ie in candidates.values():
        is_ancestor_of_head = False
        for head in heads:
            if ie.revision in head_ancestors[head]:
                is_ancestor_of_head = True
                break
        if is_ancestor_of_head:
            # already covered by a candidate analysed earlier.
            continue
        # Not an ancestor of a known head; load the versioned file for
        # this file id if nobody has done so yet.
        if entry_vf is None:
            entry_vf = versioned_file_store.get_weave_or_empty(
                self.file_id, transaction)
        ancestors = set(entry_vf.get_ancestry(ie.revision))
        # The new head may knock out previously discovered 'heads' that
        # turn out to be its ancestors.
        for head in list(heads.keys()):
            if head in ancestors:
                heads.pop(head)
        head_ancestors[ie.revision] = ancestors
        heads[ie.revision] = ie
    return heads

245

246

def get_tar_item(self, root, dp, now, tree):
    """Build the tarfile item for this entry plus a stream of its content.

    :param root: path prefix that dp is joined onto for the item name.
    :param dp: path of the entry below root.
    :param now: value stored as the item's mtime.
    :param tree: tree handed on to _put_in_tar.
    :return: (item, fileobj), fileobj being whatever _put_in_tar returned.
    """
    tar_info = tarfile.TarInfo(pathjoin(root, dp))
    # TODO: would be cool to actually set it to the timestamp of the
    # revision it was last changed
    tar_info.mtime = now
    return tar_info, self._put_in_tar(tar_info, tree)

254

255

def has_text(self):
    """Tell whether the object behind this entry carries textual data.

    Binary content counts as textual data here.

    All entries get weave files created for them regardless; this answer
    is primarily used when upgrading from old trees that did not have the
    weave index for all inventory entries.

    :return: False in this base implementation.
    """
    carries_text = False
    return carries_text

265

266

def __init__(self, file_id, name, parent_id, text_id=None):
    """Create an InventoryEntry

    name has to be one single path component relative to the parent
    directory; a whole path or a relative name containing a separator is
    rejected with InvalidEntryName.

    >>> e = InventoryFile('123', 'hello.c', ROOT_ID)
    >>> e.name
    'hello.c'
    >>> e.file_id
    '123'
    >>> e = InventoryFile('123', 'src/hello.c', ROOT_ID)
    Traceback (most recent call last):
    InvalidEntryName: Invalid entry name: src/hello.c
    """
    assert isinstance(name, basestring), name
    for separator in ('/', '\\'):
        if separator in name:
            raise InvalidEntryName(name=name)
    # what the caller told us
    self.file_id = file_id
    self.name = name
    self.parent_id = parent_id
    self.text_id = text_id
    # everything else starts out unset
    self.revision = None
    self.text_sha1 = None
    self.text_size = None
    self.symlink_target = None
    self.executable = False

293

294

def kind_character(self):
    """Return a short kind indicator useful for appending to names.

    The base implementation has no indicator to offer and always raises
    BzrError naming self.kind.
    """
    message = 'unknown kind %r' % self.kind
    raise BzrError(message)

297

298

known_kinds = ('file', 'directory', 'symlink')

299

300

def _put_in_tar(self, item, tree):
    """Fill in item for storage in a tar and return the content stream.

    Implementations return None when no content is available. The base
    implementation does not know how to export anything and always raises
    BzrError.
    """
    details = (self.file_id, self.kind)
    raise BzrError("don't know how to export {%s} of kind %r" % details)

307

308

def put_on_disk(self, dest, dp, tree):
    """Write a representation of self to disk underneath the prefix dest.

    Template method: dest and dp are joined with pathjoin and the real
    work is left to _put_on_disk, which subclasses implement.
    """
    target = pathjoin(dest, dp)
    self._put_on_disk(target, tree)
    # mutter("  export {%s} kind %s to %s", self.file_id,
    #         self.kind, target)

317

318

def _put_on_disk(self, fullpath, tree):
    """Put this entry onto disk at fullpath, taking content from tree.

    The base implementation cannot export anything and always raises
    BzrError.
    """
    details = (self.file_id, self.kind)
    raise BzrError("don't know how to export {%s} of kind %r" % details)

321

322

def sorted_children(self):
    """Return the items of self.children as a sorted list of pairs."""
    pairs = list(self.children.items())
    pairs.sort()
    return pairs

324

325

@staticmethod

326

def versionable_kind(kind):

327

return kind in ('file', 'directory', 'symlink')

328

329

def check(self, checker, rev_id, inv, tree):
    """Verify that this inventory entry is intact.

    Template method: the generic parent check is done here, kind specific
    tests belong in _check.

    :param checker: Check object providing context for the checks;
        can be used to find out what parts of the repository have already
        been checked.
    :param rev_id: Revision id from which this InventoryEntry was loaded.
         Not necessarily the last-changed revision for this file.
    :param inv: Inventory from which the entry was loaded.
    :param tree: RevisionTree for this entry.
    :raises BzrCheckError: if parent_id is set but inv does not have it.
    """
    parent_missing = (self.parent_id is not None
                      and not inv.has_id(self.parent_id))
    if parent_missing:
        raise BzrCheckError(
            'missing parent {%s} in inventory for revision {%s}'
            % (self.parent_id, rev_id))
    self._check(checker, rev_id, tree)

348

349

def _check(self, checker, rev_id, tree):
    """Run the kind specific checks for this inventory entry.

    The base implementation knows no kind and always raises BzrCheckError.
    """
    details = (self.kind, rev_id)
    raise BzrCheckError('unknown entry kind %r in revision {%s}' % details)

353

354

def copy(self):

355

"""Clone this inventory entry."""

356

raise NotImplementedError

357

358

@staticmethod

359

def describe_change(old_entry, new_entry):

360

"""Describe the change between old_entry and this.

361

362

This smells of being an InterInventoryEntry situation, but as its

363

the first one, we're making it a static method for now.

364

365

An entry with a different parent, or different name is considered

366

to be renamed. Reparenting is an internal detail.

367

Note that renaming the parent does not trigger a rename for the

368

child entry itself.

369

"""

370

# TODO: Perhaps return an object rather than just a string

371

if old_entry is new_entry:

372

# also the case of both being None

373

return 'unchanged'

374

elif old_entry is None:

375

return 'added'

376

elif new_entry is None:

377

return 'removed'

378

text_modified, meta_modified = new_entry.detect_changes(old_entry)

379

if text_modified or meta_modified:

380

modified = True

381

else:

382

modified = False

383

# TODO 20060511 (mbp, rbc) factor out 'detect_rename' here.

384

if old_entry.parent_id != new_entry.parent_id:

385

renamed = True

386

elif old_entry.name != new_entry.name:

387

renamed = True

388

else:

389

renamed = False

390

if renamed and not modified:

391

return InventoryEntry.RENAMED

392

if modified and not renamed:

393

return 'modified'

394

if modified and renamed:

395

return InventoryEntry.MODIFIED_AND_RENAMED

396

return 'unchanged'

397

398

def __repr__(self):

399

return ("%s(%r, %r, parent_id=%r, revision=%r)"

400

% (self.__class__.__name__,

401

self.file_id,

402

self.name,

403

self.parent_id,

404

self.revision))

405

406

def snapshot(self, revision, path, previous_entries,
             work_tree, commit_builder):
    """Snapshot this entry, which may or may not have changed.

    Afterwards all fields of the entry are populated and its text is
    stored in the text store or weave.

    :param revision: id of the revision being recorded.
    :param path: path used to read the entry's state from work_tree.
    :param previous_entries: map of the entries preceding this one.
    :return: "unchanged" when the only previous entry matches self (its
        revision is then reused), otherwise whatever
        _snapshot_into_revision returns.
    """
    # mutter('new parents of %s are %r', path, previous_entries)
    self._read_tree_state(path, work_tree)
    # TODO: Where should we determine whether to reuse a
    # previous revision id or create a new revision? 20060606
    # The entry can only be unchanged when there is exactly one parent
    # file revision to compare against.
    if len(previous_entries) == 1:
        sole_parent = list(previous_entries.values())[0]
        if self._unchanged(sole_parent):
            # mutter("found unchanged entry")
            self.revision = sole_parent.revision
            return "unchanged"
    return self._snapshot_into_revision(revision, previous_entries,
                                        work_tree, commit_builder)

426

427

def _snapshot_into_revision(self, revision, previous_entries, work_tree,

428

commit_builder):

429

"""Record this revision unconditionally into a store.

430

431

The entry's last-changed revision property (`revision`) is updated to

432

that of the new revision.

433

434

:param revision: id of the new revision that is being recorded.

435

436

:returns: String description of the commit (e.g. "merged", "modified"), etc.

437

"""

438

# mutter('new revision {%s} for {%s}', revision, self.file_id)

439

self.revision = revision

440

self._snapshot_text(previous_entries, work_tree, commit_builder)

441

442

def _snapshot_text(self, file_parents, work_tree, commit_builder):

443

"""Record the 'text' of this entry, whatever form that takes.

444

445

This default implementation simply adds an empty text.

446

"""

447

raise NotImplementedError(self._snapshot_text)

448

449

def __eq__(self, other):

450

if not isinstance(other, InventoryEntry):

451

return NotImplemented

452

453

return ((self.file_id == other.file_id)

454

and (self.name == other.name)

455

and (other.symlink_target == self.symlink_target)

456

and (self.text_sha1 == other.text_sha1)

457

and (self.text_size == other.text_size)

458

and (self.text_id == other.text_id)

459

and (self.parent_id == other.parent_id)

460

and (self.kind == other.kind)

461

and (self.revision == other.revision)

462

and (self.executable == other.executable)

463

)

464

465

def __ne__(self, other):
    """Inequality is simply the negation of the ``==`` comparison."""
    is_equal = (self == other)
    return not is_equal

467

468

def __hash__(self):
    """Refuse to be hashed: always raises ValueError."""
    message = 'not hashable'
    raise ValueError(message)

470

471

def _unchanged(self, previous_ie):
    """Report whether this entry is unchanged relative to previous_ie.

    The base check only looks at the location of the entry: it returns
    False when the parent directory id or the name differs, True
    otherwise.

    This method should be overridden in child classes.
    """
    # different inv parent
    if previous_ie.parent_id != self.parent_id:
        return False
    # renamed
    if previous_ie.name != self.name:
        return False
    return True

484

485

def _read_tree_state(self, path, work_tree):
    """Populate fields in the inventory entry from the given tree.

    The base implementation has nothing to read and does nothing.

    Note that this should be modified to be a noop on virtual trees
    as all entries created there are prepopulated.
    """
    # TODO: Rather than running this manually, we should check the
    # working sha1 and other expensive properties when they're
    # first requested, or preload them if they're already known
    return None  # nothing to do by default

495

496

def _forget_tree_state(self):
    """Discard state read from a tree; the base entry keeps none."""
    return None

498

499

500

class InventoryDirectory(InventoryEntry):

501

"""A directory in an inventory."""

502

503

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

504

'text_id', 'parent_id', 'children', 'executable',

505

'revision', 'symlink_target']

506

507

def _check(self, checker, rev_id, tree):

508

"""See InventoryEntry._check"""

509

if self.text_sha1 is not None or self.text_size is not None or self.text_id is not None:

510

raise BzrCheckError('directory {%s} has text in revision {%s}'

511

% (self.file_id, rev_id))

512

513

def copy(self):

514

other = InventoryDirectory(self.file_id, self.name, self.parent_id)

515

other.revision = self.revision

516

# note that children are *not* copied; they're pulled across when

517

# others are added

518

return other

519

520

def __init__(self, file_id, name, parent_id):

521

super(InventoryDirectory, self).__init__(file_id, name, parent_id)

522

self.children = {}

523

self.kind = 'directory'

524

525

def kind_character(self):

526

"""See InventoryEntry.kind_character."""

527

return '/'

528

529

def _put_in_tar(self, item, tree):

530

"""See InventoryEntry._put_in_tar."""

531

item.type = tarfile.DIRTYPE

532

fileobj = None

533

item.name += '/'

534

item.size = 0

535

item.mode = 0755

536

return fileobj

537

538

def _put_on_disk(self, fullpath, tree):

539

"""See InventoryEntry._put_on_disk."""

540

os.mkdir(fullpath)

541

542

def _snapshot_text(self, file_parents, work_tree, commit_builder):

543

"""See InventoryEntry._snapshot_text."""

544

commit_builder.modified_directory(self.file_id, file_parents)

545

546

547

class InventoryFile(InventoryEntry):

548

"""A file in an inventory."""

549

550

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

551

'text_id', 'parent_id', 'children', 'executable',

552

'revision', 'symlink_target']

553

554

def _check(self, checker, tree_revision_id, tree):

555

"""See InventoryEntry._check"""

556

t = (self.file_id, self.revision)

557

if t in checker.checked_texts:

558

prev_sha = checker.checked_texts[t]

559

if prev_sha != self.text_sha1:

560

raise BzrCheckError('mismatched sha1 on {%s} in {%s}' %

561

(self.file_id, tree_revision_id))

562

else:

563

checker.repeated_text_cnt += 1

564

return

565

566

if self.file_id not in checker.checked_weaves:

567

mutter('check weave {%s}', self.file_id)

568

w = tree.get_weave(self.file_id)

569

# Not passing a progress bar, because it creates a new

570

# progress, which overwrites the current progress,

571

# and doesn't look nice

572

w.check()

573

checker.checked_weaves[self.file_id] = True

574

else:

575

w = tree.get_weave(self.file_id)

576

577

mutter('check version {%s} of {%s}', tree_revision_id, self.file_id)

578

checker.checked_text_cnt += 1

579

# We can't check the length, because Weave doesn't store that

580

# information, and the whole point of looking at the weave's

581

# sha1sum is that we don't have to extract the text.

582

if self.text_sha1 != w.get_sha1(self.revision):

583

raise BzrCheckError('text {%s} version {%s} wrong sha1'

584

% (self.file_id, self.revision))

585

checker.checked_texts[t] = self.text_sha1

586

587

def copy(self):

588

other = InventoryFile(self.file_id, self.name, self.parent_id)

589

other.executable = self.executable

590

other.text_id = self.text_id

591

other.text_sha1 = self.text_sha1

592

other.text_size = self.text_size

593

other.revision = self.revision

594

return other

595

596

def detect_changes(self, old_entry):

597

"""See InventoryEntry.detect_changes."""

598

assert self.text_sha1 is not None

599

assert old_entry.text_sha1 is not None

600

text_modified = (self.text_sha1 != old_entry.text_sha1)

601

meta_modified = (self.executable != old_entry.executable)

602

return text_modified, meta_modified

603

604

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

605

output_to, reverse=False):

606

"""See InventoryEntry._diff."""

607

try:

608

from_text = tree.get_file(self.file_id).readlines()

609

if to_entry:

610

to_text = to_tree.get_file(to_entry.file_id).readlines()

611

else:

612

to_text = []

613

if not reverse:

614

text_diff(from_label, from_text,

615

to_label, to_text, output_to)

616

else:

617

text_diff(to_label, to_text,

618

from_label, from_text, output_to)

619

except BinaryFile:

620

if reverse:

621

label_pair = (to_label, from_label)

622

else:

623

label_pair = (from_label, to_label)

624

print >> output_to, "Binary files %s and %s differ" % label_pair

625

626

def has_text(self):

627

"""See InventoryEntry.has_text."""

628

return True

629

630

def __init__(self, file_id, name, parent_id):

631

super(InventoryFile, self).__init__(file_id, name, parent_id)

632

self.kind = 'file'

633

634

def kind_character(self):

635

"""See InventoryEntry.kind_character."""

636

return ''

637

638

def _put_in_tar(self, item, tree):

639

"""See InventoryEntry._put_in_tar."""

640

item.type = tarfile.REGTYPE

641

fileobj = tree.get_file(self.file_id)

642

item.size = self.text_size

643

if tree.is_executable(self.file_id):

644

item.mode = 0755

645

else:

646

item.mode = 0644

647

return fileobj

648

649

def _put_on_disk(self, fullpath, tree):

650

"""See InventoryEntry._put_on_disk."""

651

pumpfile(tree.get_file(self.file_id), file(fullpath, 'wb'))

652

if tree.is_executable(self.file_id):

653

os.chmod(fullpath, 0755)

654

655

def _read_tree_state(self, path, work_tree):

656

"""See InventoryEntry._read_tree_state."""

657

self.text_sha1 = work_tree.get_file_sha1(self.file_id, path=path)

658

# FIXME: 20050930 probe for the text size when getting sha1

659

# in _read_tree_state

660

self.executable = work_tree.is_executable(self.file_id, path=path)

661

662

def __repr__(self):

663

return ("%s(%r, %r, parent_id=%r, sha1=%r, len=%s)"

664

% (self.__class__.__name__,

665

self.file_id,

666

self.name,

667

self.parent_id,

668

self.text_sha1,

669

self.text_size))

670

671

def _forget_tree_state(self):

672

self.text_sha1 = None

673

674

def _snapshot_text(self, file_parents, work_tree, commit_builder):

675

"""See InventoryEntry._snapshot_text."""

676

def get_content_byte_lines():

677

return work_tree.get_file(self.file_id).readlines()

678

self.text_sha1, self.text_size = commit_builder.modified_file_text(

679

self.file_id, file_parents, get_content_byte_lines, self.text_sha1, self.text_size)

680

681

def _unchanged(self, previous_ie):

682

"""See InventoryEntry._unchanged."""

683

compatible = super(InventoryFile, self)._unchanged(previous_ie)

684

if self.text_sha1 != previous_ie.text_sha1:

685

compatible = False

686

else:

687

# FIXME: 20050930 probe for the text size when getting sha1

688

# in _read_tree_state

689

self.text_size = previous_ie.text_size

690

if self.executable != previous_ie.executable:

691

compatible = False

692

return compatible

693

694

695

class InventoryLink(InventoryEntry):

696

"""A file in an inventory."""

697

698

__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',

699

'text_id', 'parent_id', 'children', 'executable',

700

'revision', 'symlink_target']

701

702

def _check(self, checker, rev_id, tree):

703

"""See InventoryEntry._check"""

704

if self.text_sha1 is not None or self.text_size is not None or self.text_id is not None:

705

raise BzrCheckError('symlink {%s} has text in revision {%s}'

706

% (self.file_id, rev_id))

707

if self.symlink_target is None:

708

raise BzrCheckError('symlink {%s} has no target in revision {%s}'

709

% (self.file_id, rev_id))

710

711

def copy(self):

712

other = InventoryLink(self.file_id, self.name, self.parent_id)

713

other.symlink_target = self.symlink_target

714

other.revision = self.revision

715

return other

716

717

def detect_changes(self, old_entry):

718

"""See InventoryEntry.detect_changes."""

719

# FIXME: which _modified field should we use ? RBC 20051003

720

text_modified = (self.symlink_target != old_entry.symlink_target)

721

if text_modified:

722

mutter(" symlink target changed")

723

meta_modified = False

724

return text_modified, meta_modified

725

726

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

727

output_to, reverse=False):

728

"""See InventoryEntry._diff."""

729

from_text = self.symlink_target

730

if to_entry is not None:

731

to_text = to_entry.symlink_target

732

if reverse:

733

temp = from_text

734

from_text = to_text

735

to_text = temp

736

print >>output_to, '=== target changed %r => %r' % (from_text, to_text)

737

else:

738

if not reverse:

739

print >>output_to, '=== target was %r' % self.symlink_target

740

else:

741

print >>output_to, '=== target is %r' % self.symlink_target

742

743

def __init__(self, file_id, name, parent_id):

744

super(InventoryLink, self).__init__(file_id, name, parent_id)

745

self.kind = 'symlink'

746

747

def kind_character(self):

748

"""See InventoryEntry.kind_character."""

749

return ''

750

751

def _put_in_tar(self, item, tree):

752

"""See InventoryEntry._put_in_tar."""

753

item.type = tarfile.SYMTYPE

754

fileobj = None

755

item.size = 0

756

item.mode = 0755

757

item.linkname = self.symlink_target

758

return fileobj

759

760

def _put_on_disk(self, fullpath, tree):

761

"""See InventoryEntry._put_on_disk."""

762

try:

763

os.symlink(self.symlink_target, fullpath)

764

except OSError,e:

765

raise BzrError("Failed to create symlink %r -> %r, error: %s" % (fullpath, self.symlink_target, e))

766

767

def _read_tree_state(self, path, work_tree):

768

"""See InventoryEntry._read_tree_state."""

769

self.symlink_target = work_tree.get_symlink_target(self.file_id)

770

771

def _forget_tree_state(self):

772

self.symlink_target = None

773

774

def _unchanged(self, previous_ie):

775

"""See InventoryEntry._unchanged."""

776

compatible = super(InventoryLink, self)._unchanged(previous_ie)

777

if self.symlink_target != previous_ie.symlink_target:

778

compatible = False

779

return compatible

780

781

def _snapshot_text(self, file_parents, work_tree, commit_builder):

782

"""See InventoryEntry._snapshot_text."""

783

commit_builder.modified_link(

784

self.file_id, file_parents, self.symlink_target)

785

786

787

class Inventory(object):
    """Inventory of versioned files in a tree.

    This describes which file_id is present at each point in the tree,
    and possibly the SHA-1 or other information about the file.
    Entries can be looked up either by path or by file_id.

    The inventory represents a typical unix file tree, with
    directories containing files and subdirectories.  We never store
    the full path to a file, because renaming a directory implicitly
    moves all of its contents.  This class internally maintains a
    lookup tree that allows the children under a directory to be
    returned quickly.

    InventoryEntry objects must not be modified after they are
    inserted, other than through the Inventory API.

    >>> inv = Inventory()
    >>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))
    InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT', sha1=None, len=None)
    >>> inv['123-123'].name
    'hello.c'

    May be treated as an iterator or set to look up file ids:

    >>> bool(inv.path2id('hello.c'))
    True
    >>> '123-123' in inv
    True

    May also look up by name:

    >>> [x[0] for x in inv.iter_entries()]
    ['', u'hello.c']
    >>> inv = Inventory('TREE_ROOT-12345678-12345678')
    >>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))
    InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT-12345678-12345678', sha1=None, len=None)
    """
    def __init__(self, root_id=ROOT_ID, revision_id=None):
        """Create an inventory that contains only a root directory.

        :param root_id: file_id given to the root directory entry.
        :param revision_id: stored unchanged as `self.revision_id`.
        """
        # We are letting Branch.create() create a unique inventory
        # root id. Rather than generating a random one here.
        #if root_id is None:
        #    root_id = bzrlib.branch.gen_file_id('TREE_ROOT')
        self.root = InventoryDirectory(root_id, '', None)
        # FIXME: this isn't ever used, changing it to self.revision may break
        # things. TODO make everything use self.revision_id
        self.revision_id = revision_id
        # Index of every entry (including the root) by file_id.
        self._byid = {self.root.file_id: self.root}

    def copy(self):
        """Return a new Inventory holding copies of all entries.

        The copy gets the same root file_id; `revision_id` is not copied.
        """
        # TODO: jam 20051218 Should copy also copy the revision_id?
        entries = self.iter_entries()
        # The first pair yielded is always the root.
        other = Inventory(entries.next()[1].file_id)
        # copy recursively so we know directories will be added before
        # their children.  There are more efficient ways than this...
        # `entries` is a generator object: iterate it, do not call it.
        for path, entry in entries:
            other.add(entry.copy())
        return other

    def __iter__(self):
        """Iterate over the file_ids in this inventory."""
        return iter(self._byid)

    def __len__(self):
        """Returns number of entries."""
        return len(self._byid)

    def iter_entries(self, from_dir=None):
        """Return (path, entry) pairs, in order by name.

        :param from_dir: None to start at the root (the root itself is
            then yielded first, with path ''), or a file_id string or
            directory entry to start from (which is not yielded itself).
        """
        if from_dir is None:
            assert self.root
            from_dir = self.root
            yield '', self.root
        elif isinstance(from_dir, basestring):
            from_dir = self._byid[from_dir]

        # unrolling the recursive called changed the time from
        # 440ms/663ms (inline/total) to 116ms/116ms
        children = from_dir.children.items()
        children.sort()
        children = collections.deque(children)
        stack = [(u'', children)]
        while stack:
            from_dir_relpath, children = stack[-1]

            while children:
                name, ie = children.popleft()

                # we know that from_dir_relpath never ends in a slash
                # and 'f' doesn't begin with one, we can do a string op, rather
                # than the checks of pathjoin(), though this means that all paths
                # start with a slash
                path = from_dir_relpath + '/' + name

                yield path[1:], ie

                if ie.kind != 'directory':
                    continue

                # But do this child first
                new_children = ie.children.items()
                new_children.sort()
                new_children = collections.deque(new_children)
                stack.append((path, new_children))
                # Break out of inner loop, so that we start outer loop with child
                break
            else:
                # if we finished all children, pop it off the stack
                stack.pop()

    def iter_entries_by_dir(self, from_dir=None):
        """Iterate over the entries in a directory first order.

        This returns all entries for a directory before returning
        the entries for children of a directory. This is not
        lexicographically sorted order, and is a hybrid between
        depth-first and breadth-first.

        :return: This yields (path, entry) pairs
        """
        # TODO? Perhaps this should return the from_dir so that the root is
        # yielded? or maybe an option?
        if from_dir is None:
            assert self.root
            from_dir = self.root
            yield '', self.root
        elif isinstance(from_dir, basestring):
            from_dir = self._byid[from_dir]

        stack = [(u'', from_dir)]
        while stack:
            cur_relpath, cur_dir = stack.pop()

            child_dirs = []
            for child_name, child_ie in sorted(cur_dir.children.iteritems()):

                child_relpath = cur_relpath + child_name

                yield child_relpath, child_ie

                if child_ie.kind == 'directory':
                    child_dirs.append((child_relpath+'/', child_ie))
            # Reversed so that popping from the end visits them in order.
            stack.extend(reversed(child_dirs))

    def entries(self):
        """Return list of (path, ie) for all entries except the root.

        This may be faster than iter_entries.
        """
        accum = []
        def descend(dir_ie, dir_path):
            kids = dir_ie.children.items()
            kids.sort()
            for name, ie in kids:
                child_path = pathjoin(dir_path, name)
                accum.append((child_path, ie))
                if ie.kind == 'directory':
                    descend(ie, child_path)

        descend(self.root, u'')
        return accum

    def directories(self):
        """Return (path, entry) pairs for all directories, including the root.
        """
        accum = []
        def descend(parent_ie, parent_path):
            accum.append((parent_path, parent_ie))

            kids = [(ie.name, ie) for ie in parent_ie.children.itervalues() if ie.kind == 'directory']
            kids.sort()

            for name, child_ie in kids:
                child_path = pathjoin(parent_path, name)
                descend(child_ie, child_path)
        descend(self.root, u'')
        return accum

    def __contains__(self, file_id):
        """True if this entry contains a file with given id.

        >>> inv = Inventory()
        >>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))
        InventoryFile('123', 'foo.c', parent_id='TREE_ROOT', sha1=None, len=None)
        >>> '123' in inv
        True
        >>> '456' in inv
        False
        """
        return file_id in self._byid

    def __getitem__(self, file_id):
        """Return the entry for given file_id.

        :raises BzrError: if there is no entry with that file_id.

        >>> inv = Inventory()
        >>> inv.add(InventoryFile('123123', 'hello.c', ROOT_ID))
        InventoryFile('123123', 'hello.c', parent_id='TREE_ROOT', sha1=None, len=None)
        >>> inv['123123'].name
        'hello.c'
        """
        try:
            return self._byid[file_id]
        except KeyError:
            if file_id is None:
                raise BzrError("can't look up file_id None")
            else:
                raise BzrError("file_id {%s} not in inventory" % file_id)

    def get_file_kind(self, file_id):
        """Return the kind of the entry with the given file_id."""
        return self._byid[file_id].kind

    def get_child(self, parent_id, filename):
        """Return the named child of a directory, or None if absent."""
        return self[parent_id].children.get(filename)

    def add(self, entry):
        """Add entry to inventory.

        To add a file to a branch ready to be committed, use Branch.add,
        which calls this.

        A parent_id of ROOT_ID or None is replaced by the file_id of this
        inventory's root.

        :raises BzrError: if the file_id is already present, the parent is
            not in the inventory, or the name is taken in the parent.

        Returns the new entry object.
        """
        if entry.file_id in self._byid:
            raise BzrError("inventory already contains entry with id {%s}" % entry.file_id)

        if entry.parent_id == ROOT_ID or entry.parent_id is None:
            entry.parent_id = self.root.file_id

        try:
            parent = self._byid[entry.parent_id]
        except KeyError:
            raise BzrError("parent_id {%s} not in inventory" % entry.parent_id)

        if entry.name in parent.children:
            raise BzrError("%s is already versioned" %
                    pathjoin(self.id2path(parent.file_id), entry.name))

        self._byid[entry.file_id] = entry
        parent.children[entry.name] = entry
        return entry

    def add_path(self, relpath, kind, file_id=None, parent_id=None):
        """Add entry from a path.

        The immediate parent must already be versioned.

        An empty path replaces the root: a fresh root directory is
        installed and the id index is reset to contain only that root.

        NOTE(review): the `parent_id` argument is never read; the parent
        is always derived from `relpath`.

        :raises NotVersionedError: if the parent path is not versioned.

        Returns the new entry object."""

        parts = osutils.splitpath(relpath)

        if not parts:
            if file_id is None:
                file_id = bzrlib.workingtree.gen_root_id()
            self.root = InventoryDirectory(file_id, '', None)
            self._byid = {self.root.file_id: self.root}
            # Return the new root so that every path through this method
            # hands back the entry it created.
            return self.root

        parent_path = parts[:-1]
        parent_id = self.path2id(parent_path)
        if parent_id is None:
            raise NotVersionedError(path=parent_path)
        ie = make_entry(kind, parts[-1], parent_id, file_id)
        return self.add(ie)

    def __delitem__(self, file_id):
        """Remove entry by id.

        >>> inv = Inventory()
        >>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))
        InventoryFile('123', 'foo.c', parent_id='TREE_ROOT', sha1=None, len=None)
        >>> '123' in inv
        True
        >>> del inv['123']
        >>> '123' in inv
        False
        """
        ie = self[file_id]

        assert ie.parent_id is None or \
            self[ie.parent_id].children[ie.name] == ie

        del self._byid[file_id]
        if ie.parent_id is not None:
            del self[ie.parent_id].children[ie.name]

    def __eq__(self, other):
        """Compare two sets by comparing their contents.

        >>> i1 = Inventory()
        >>> i2 = Inventory()
        >>> i1 == i2
        True
        >>> i1.add(InventoryFile('123', 'foo', ROOT_ID))
        InventoryFile('123', 'foo', parent_id='TREE_ROOT', sha1=None, len=None)
        >>> i1 == i2
        False
        >>> i2.add(InventoryFile('123', 'foo', ROOT_ID))
        InventoryFile('123', 'foo', parent_id='TREE_ROOT', sha1=None, len=None)
        >>> i1 == i2
        True
        """
        if not isinstance(other, Inventory):
            return NotImplemented

        return self._byid == other._byid

    def __ne__(self, other):
        """Inequality is the negation of the ``==`` comparison."""
        # Go through the == operator rather than calling __eq__ directly:
        # __eq__ may return NotImplemented, and `not NotImplemented` would
        # wrongly report a non-Inventory operand as "not different".
        return not (self == other)

    def __hash__(self):
        raise ValueError('not hashable')

    def _iter_file_id_parents(self, file_id):
        """Yield the parents of file_id up to the root.

        The entry for file_id itself is yielded first.
        """
        while file_id is not None:
            try:
                ie = self._byid[file_id]
            except KeyError:
                raise BzrError("file_id {%s} not found in inventory" % file_id)
            yield ie
            file_id = ie.parent_id

    def get_idpath(self, file_id):
        """Return a list of file_ids for the path to an entry.

        The list contains one element for each directory followed by
        the id of the file itself.  So the length of the returned list
        is equal to the depth of the file in the tree, counting the
        root directory as depth 1.
        """
        # Collected leaf-first, then reversed so the root comes first.
        p = [parent.file_id for parent in self._iter_file_id_parents(file_id)]
        p.reverse()
        return p

    def id2path(self, file_id):
        """Return as a string the path to file_id.

        >>> i = Inventory()
        >>> e = i.add(InventoryDirectory('src-id', 'src', ROOT_ID))
        >>> e = i.add(InventoryFile('foo-id', 'foo.c', parent_id='src-id'))
        >>> print i.id2path('foo-id')
        src/foo.c
        """
        # get all names, skipping root
        return '/'.join(reversed(
            [parent.name for parent in
             self._iter_file_id_parents(file_id)][:-1]))

    def path2id(self, name):
        """Walk down through directories to return entry of last component.

        names may be either a list of path components, or a single
        string, in which case it is automatically split.

        This returns the file_id of the last component in the path,
        which may be either a file or a directory.

        Returns None IFF the path is not found.
        """
        if isinstance(name, types.StringTypes):
            name = splitpath(name)

        # mutter("lookup path %r" % name)

        parent = self.root
        for f in name:
            try:
                cie = parent.children[f]
                assert cie.name == f
                assert cie.parent_id == parent.file_id
                parent = cie
            except KeyError:
                # or raise an error?
                return None

        return parent.file_id

    def has_filename(self, names):
        """True if path2id finds a (truthy) file_id for the given path."""
        return bool(self.path2id(names))

    def has_id(self, file_id):
        """True if an entry with this file_id is in the inventory."""
        return file_id in self._byid

    def rename(self, file_id, new_parent_id, new_name):
        """Move a file within the inventory.

        This can change either the name, or the parent, or both.

        :raises BzrError: if the new name is not acceptable, already
            exists in the new parent, or the move would put a directory
            inside itself.

        This does not move the working file."""
        if not is_valid_name(new_name):
            raise BzrError("not an acceptable filename: %r" % new_name)

        new_parent = self._byid[new_parent_id]
        if new_name in new_parent.children:
            raise BzrError("%r already exists in %r" % (new_name, self.id2path(new_parent_id)))

        new_parent_idpath = self.get_idpath(new_parent_id)
        if file_id in new_parent_idpath:
            raise BzrError("cannot move directory %r into a subdirectory of itself, %r"
                    % (self.id2path(file_id), self.id2path(new_parent_id)))

        file_ie = self._byid[file_id]
        old_parent = self._byid[file_ie.parent_id]

        # TODO: Don't leave things messed up if this fails

        del old_parent.children[file_ie.name]
        new_parent.children[new_name] = file_ie

        file_ie.name = new_name
        file_ie.parent_id = new_parent_id

    def is_root(self, file_id):
        """True if file_id is the id of this inventory's root."""
        return self.root is not None and file_id == self.root.file_id

1210

1211

1212

def make_entry(kind, name, parent_id, file_id=None):
    """Build an inventory entry of the requested kind.

    The name is replaced by its normalized form when that form is
    accessible; if it differs but is not accessible,
    errors.InvalidNormalization is raised.  A BzrError is raised for a
    kind other than 'directory', 'file' or 'symlink'.

    :param kind: the type of inventory entry to create.
    :param name: the basename of the entry.
    :param parent_id: the parent_id of the entry.
    :param file_id: the file_id to use. if None, one will be created
        (from the name as passed in, before normalization).
    """
    if file_id is None:
        file_id = bzrlib.workingtree.gen_file_id(name)

    norm_name, can_access = osutils.normalized_filename(name)
    if norm_name != name:
        if not can_access:
            # TODO: jam 20060701 This would probably be more useful
            #       if the error was raised with the full path
            raise errors.InvalidNormalization(name)
        name = norm_name

    # Pick the entry class first, then construct it in one place.
    if kind == 'directory':
        entry_class = InventoryDirectory
    elif kind == 'file':
        entry_class = InventoryFile
    elif kind == 'symlink':
        entry_class = InventoryLink
    else:
        raise BzrError("unknown kind %r" % kind)
    return entry_class(file_id, name, parent_id)

1240

1241

1242

# Compiled lazily on the first call to is_valid_name().
_NAME_RE = None


def is_valid_name(name):
    """Return True if `name` matches the acceptable-name pattern.

    The pattern requires at least one character and rejects any name
    containing a forward slash or a backslash.
    """
    global _NAME_RE
    pattern = _NAME_RE
    if pattern is None:
        pattern = _NAME_RE = re.compile(r'^[^/\\]+$')

    return pattern.match(name) is not None

Older »