/brz/remove-bazaar : revision 1733.1.7

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/inventory.py

Committer: Jelmer Vernooij
Date: 2006-06-13 15:04:06 UTC
mto: (1769.1.1 integration)
mto: This revision was merged to the branch mainline in revision 1770.
Revision ID: jelmer@samba.org-20060613150406-fb8b663191b0bd2a

Change set of control dir formats to list.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/read_bundle.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v07.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/README.1st

doc/configuration.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

generate_docs.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/inventory.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# FIXME: This refactoring of the workingtree code doesn't seem to keep

# the WorkingTree's copy of the inventory in sync with the branch. The

# branch modifies its working inventory when it does a commit to make

# missing files permanently removed.

# TODO: Maybe also keep the full path of the entry, and the children?

# But those depend on its position within a particular inventory, and

# it would be nice not to need to hold the backpointer here.

# This should really be an id randomly assigned when the tree is

# created, but it's not for now.

ROOT_ID = "TREE_ROOT"

import collections

import os.path

import re

import sys

import tarfile

import types

import bzrlib

from bzrlib.osutils import (pumpfile, quotefn, splitpath, joinpath,

pathjoin, sha_strings)

from bzrlib.errors import (NotVersionedError, InvalidEntryName,

BzrError, BzrCheckError, BinaryFile)

from bzrlib.trace import mutter

class InventoryEntry(object):
    """Description of a versioned file.

    An InventoryEntry has the following fields, which are also
    present in the XML inventory-entry element:

    file_id

    name
        (within the parent directory)

    parent_id
        file_id of the parent directory, or ROOT_ID

    revision
        the revision_id in which this variation of this file was
        introduced.

    executable
        Indicates that this file should be executable on systems
        that support it.

    text_sha1
        sha-1 of the text of the file

    text_size
        size in bytes of the text of the file

    (reading a version 4 tree created a text_id field.)

    >>> i = Inventory()
    >>> i.path2id('')
    'TREE_ROOT'
    >>> i.add(InventoryDirectory('123', 'src', ROOT_ID))
    InventoryDirectory('123', 'src', parent_id='TREE_ROOT', revision=None)
    >>> i.add(InventoryFile('2323', 'hello.c', parent_id='123'))
    InventoryFile('2323', 'hello.c', parent_id='123', sha1=None, len=None)
    >>> shouldbe = {0: 'src', 1: pathjoin('src','hello.c')}
    >>> for ix, j in enumerate(i.iter_entries()):
    ...     print (j[0] == shouldbe[ix], j[1])
    ...
    (True, InventoryDirectory('123', 'src', parent_id='TREE_ROOT', revision=None))
    (True, InventoryFile('2323', 'hello.c', parent_id='123', sha1=None, len=None))
    >>> i.add(InventoryFile('2323', 'bye.c', '123'))
    Traceback (most recent call last):
    ...
    BzrError: inventory already contains entry with id {2323}
    >>> i.add(InventoryFile('2324', 'bye.c', '123'))
    InventoryFile('2324', 'bye.c', parent_id='123', sha1=None, len=None)
    >>> i.add(InventoryDirectory('2325', 'wibble', '123'))
    InventoryDirectory('2325', 'wibble', parent_id='123', revision=None)
    >>> i.path2id('src/wibble')
    '2325'
    >>> '2325' in i
    True
    >>> i.add(InventoryFile('2326', 'wibble.c', '2325'))
    InventoryFile('2326', 'wibble.c', parent_id='2325', sha1=None, len=None)
    >>> i['2326']
    InventoryFile('2326', 'wibble.c', parent_id='2325', sha1=None, len=None)
    >>> for path, entry in i.iter_entries():
    ...     print path
    ...     assert i.path2id(path)
    ...
    src
    src/bye.c
    src/hello.c
    src/wibble
    src/wibble/wibble.c
    >>> i.id2path('2326')
    'src/wibble/wibble.c'
    """

    # Constants returned by describe_change()
    #
    # TODO: These should probably move to some kind of FileChangeDescription
    # class; that's like what's inside a TreeDelta but we want to be able to
    # generate them just for one file at a time.
    RENAMED = 'renamed'
    MODIFIED_AND_RENAMED = 'modified and renamed'

    # 'symlink_target' is listed because __init__ assigns it and __eq__
    # reads it; without the slot a plain InventoryEntry instance (which has
    # no __dict__) could not hold the attribute.
    __slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',
                 'text_id', 'parent_id', 'children', 'executable',
                 'revision', 'symlink_target']

    def detect_changes(self, old_entry):
        """Return a (text_modified, meta_modified) from this to old_entry.

        _read_tree_state must have been called on self and old_entry prior to
        calling detect_changes.

        This base implementation always reports (False, False).
        """
        return False, False

    def diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,
             output_to, reverse=False):
        """Perform a diff from this to to_entry.

        text_diff will be used for textual difference calculation.
        This is a template method, override _diff in child classes.

        The tree state of self (and of to_entry, when it is given) is
        refreshed via _read_tree_state before _diff is invoked.
        """
        self._read_tree_state(tree.id2path(self.file_id), tree)
        if to_entry:
            # cannot diff from one kind to another - you must do a removal
            # and an add if they do not match.
            assert self.kind == to_entry.kind
            to_entry._read_tree_state(to_tree.id2path(to_entry.file_id),
                                      to_tree)
        self._diff(text_diff, from_label, tree, to_label, to_entry, to_tree,
                   output_to, reverse)

    def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,
              output_to, reverse=False):
        """Perform a diff between two entries of the same kind."""

    def find_previous_heads(self, previous_inventories,
                            versioned_file_store,
                            transaction,
                            entry_vf=None):
        """Return the revisions and entries that directly precede this.

        Returned as a map from revision to inventory entry.

        This is a map containing the file revisions in all parents
        for which the file exists, and its revision is not a parent of
        any other. If the file is new, the set will be empty.

        :param previous_inventories: Iterable of inventories to search for
            self.file_id; each must support ``in`` and item lookup by
            file id.
        :param versioned_file_store: A store where ancestry data on this
            file id can be queried.
        :param transaction: The transaction that queries to the versioned
            file store should be completed under.
        :param entry_vf: The entry versioned file, if its already available.
        """
        def get_ancestors(weave, entry):
            return set(weave.get_ancestry(entry.revision))
        # revision:ie mapping for each ie found in previous_inventories.
        candidates = {}
        # revision:ie mapping with one revision for each head.
        heads = {}
        # revision: ancestor list for each head
        head_ancestors = {}
        # identify candidate head revision ids.
        for inv in previous_inventories:
            if self.file_id in inv:
                ie = inv[self.file_id]
                assert ie.file_id == self.file_id
                if ie.revision in candidates:
                    # same revision value in two different inventories:
                    # correct possible inconsistencies:
                    #     * there was a bug in revision updates with 'x' bit
                    #       support.
                    try:
                        if candidates[ie.revision].executable != ie.executable:
                            candidates[ie.revision].executable = False
                            ie.executable = False
                    except AttributeError:
                        pass
                    # must now be the same.
                    assert candidates[ie.revision] == ie
                else:
                    # add this revision as a candidate.
                    candidates[ie.revision] = ie

        # common case optimisation
        if len(candidates) == 1:
            # if there is only one candidate revision found
            # then we can avoid opening the versioned file to access
            # ancestry: there cannot be any ancestors to eliminate when
            # there is only one revision available.
            # NOTE: `ie` here is the last entry examined by the loop above.
            heads[ie.revision] = ie
            return heads

        # eliminate ancestors amongst the available candidates:
        # heads are those that are not an ancestor of any other candidate
        # - this provides convergence at a per-file level.
        for ie in candidates.values():
            # may be an ancestor of a known head:
            already_present = 0 != len(
                [head for head in heads
                 if ie.revision in head_ancestors[head]])
            if already_present:
                # an ancestor of an analyzed candidate.
                continue
            # not an ancestor of a known head:
            # load the versioned file for this file id if needed
            if entry_vf is None:
                entry_vf = versioned_file_store.get_weave_or_empty(
                    self.file_id, transaction)
            ancestors = get_ancestors(entry_vf, ie)
            # may knock something else out:
            check_heads = list(heads.keys())
            for head in check_heads:
                if head in ancestors:
                    # this previously discovered 'head' is not
                    # really a head - it's an ancestor of the newly
                    # found head,
                    heads.pop(head)
            head_ancestors[ie.revision] = ancestors
            heads[ie.revision] = ie
        return heads

    def get_tar_item(self, root, dp, now, tree):
        """Get a tarfile item and a file stream for its content.

        The item is named pathjoin(root, dp) and its mtime is set to now;
        the kind-specific details are filled in by _put_in_tar.

        :returns: (tarfile.TarInfo, fileobj) where fileobj is whatever
            _put_in_tar returned.
        """
        item = tarfile.TarInfo(pathjoin(root, dp))
        # TODO: would be cool to actually set it to the timestamp of the
        # revision it was last changed
        item.mtime = now
        fileobj = self._put_in_tar(item, tree)
        return item, fileobj

    def has_text(self):
        """Return true if the object this entry represents has textual data.

        Note that textual data includes binary content.

        Also note that all entries get weave files created for them.
        This attribute is primarily used when upgrading from old trees that
        did not have the weave index for all inventory entries.
        """
        return False

    def __init__(self, file_id, name, parent_id, text_id=None):
        """Create an InventoryEntry

        The filename must be a single component, relative to the
        parent directory; it cannot be a whole path or relative name.

        >>> e = InventoryFile('123', 'hello.c', ROOT_ID)
        >>> e.name
        'hello.c'
        >>> e.file_id
        '123'
        >>> e = InventoryFile('123', 'src/hello.c', ROOT_ID)
        Traceback (most recent call last):
        InvalidEntryName: Invalid entry name: src/hello.c
        """
        assert isinstance(name, basestring), name
        if '/' in name or '\\' in name:
            raise InvalidEntryName(name=name)
        self.executable = False
        self.revision = None
        self.text_sha1 = None
        self.text_size = None
        self.file_id = file_id
        self.name = name
        self.text_id = text_id
        self.parent_id = parent_id
        self.symlink_target = None

    def kind_character(self):
        """Return a short kind indicator useful for appending to names.

        The base implementation raises BzrError; kinds that have an
        indicator override this.
        """
        raise BzrError('unknown kind %r' % self.kind)

    known_kinds = ('file', 'directory', 'symlink', 'root_directory')

    def _put_in_tar(self, item, tree):
        """populate item for stashing in a tar, and return the content stream.

        If no content is available, return None.

        The base implementation raises BzrError.
        """
        raise BzrError("don't know how to export {%s} of kind %r" %
                       (self.file_id, self.kind))

    def put_on_disk(self, dest, dp, tree):
        """Create a representation of self on disk in the prefix dest.

        This is a template method - implement _put_on_disk in subclasses.
        """
        fullpath = pathjoin(dest, dp)
        self._put_on_disk(fullpath, tree)
        mutter(" export {%s} kind %s to %s", self.file_id,
               self.kind, fullpath)

    def _put_on_disk(self, fullpath, tree):
        """Put this entry onto disk at fullpath, from tree tree."""
        raise BzrError("don't know how to export {%s} of kind %r" % (self.file_id, self.kind))

    def sorted_children(self):
        """Return the (name, entry) items of self.children as a sorted list."""
        # sorted() always yields a list, whether or not dict.items() does.
        return sorted(self.children.items())

    @staticmethod
    def versionable_kind(kind):
        """Return True if kind is 'file', 'directory' or 'symlink'."""
        return kind in ('file', 'directory', 'symlink')

    def check(self, checker, rev_id, inv, tree):
        """Check this inventory entry is intact.

        This is a template method, override _check for kind specific
        tests.

        :param checker: Check object providing context for the checks;
             can be used to find out what parts of the repository have already
             been checked.
        :param rev_id: Revision id from which this InventoryEntry was loaded.
             Not necessarily the last-changed revision for this file.
        :param inv: Inventory from which the entry was loaded.
        :param tree: RevisionTree for this entry.
        :raises BzrCheckError: if parent_id is set but absent from inv.
        """
        if self.parent_id is not None:
            if not inv.has_id(self.parent_id):
                raise BzrCheckError('missing parent {%s} in inventory for revision {%s}'
                                    % (self.parent_id, rev_id))
        self._check(checker, rev_id, tree)

    def _check(self, checker, rev_id, tree):
        """Check this inventory entry for kind specific errors."""
        raise BzrCheckError('unknown entry kind %r in revision {%s}' %
                            (self.kind, rev_id))

    def copy(self):
        """Clone this inventory entry."""
        raise NotImplementedError

    @staticmethod
    def describe_change(old_entry, new_entry):
        """Describe the change between old_entry and new_entry.

        This smells of being an InterInventoryEntry situation, but as its
        the first one, we're making it a static method for now.

        An entry with a different parent, or different name is considered
        to be renamed. Reparenting is an internal detail.
        Note that renaming the parent does not trigger a rename for the
        child entry itself.

        :returns: one of 'unchanged', 'added', 'removed', 'modified',
            InventoryEntry.RENAMED or InventoryEntry.MODIFIED_AND_RENAMED.
        """
        # TODO: Perhaps return an object rather than just a string
        if old_entry is new_entry:
            # also the case of both being None
            return 'unchanged'
        elif old_entry is None:
            return 'added'
        elif new_entry is None:
            return 'removed'
        text_modified, meta_modified = new_entry.detect_changes(old_entry)
        modified = bool(text_modified or meta_modified)
        # TODO 20060511 (mbp, rbc) factor out 'detect_rename' here.
        renamed = (old_entry.parent_id != new_entry.parent_id
                   or old_entry.name != new_entry.name)
        if renamed and not modified:
            return InventoryEntry.RENAMED
        if modified and not renamed:
            return 'modified'
        if modified and renamed:
            return InventoryEntry.MODIFIED_AND_RENAMED
        return 'unchanged'

    def __repr__(self):
        return ("%s(%r, %r, parent_id=%r, revision=%r)"
                % (self.__class__.__name__,
                   self.file_id,
                   self.name,
                   self.parent_id,
                   self.revision))

    def snapshot(self, revision, path, previous_entries,
                 work_tree, commit_builder):
        """Make a snapshot of this entry which may or may not have changed.

        This means that all its fields are populated, that it has its
        text stored in the text store or weave.

        :returns: "unchanged" when there is exactly one previous entry and
            _unchanged() accepts it; otherwise whatever
            _snapshot_into_revision returns.
        """
        mutter('new parents of %s are %r', path, previous_entries)
        self._read_tree_state(path, work_tree)
        # TODO: Where should we determine whether to reuse a
        # previous revision id or create a new revision? 20060606
        if len(previous_entries) == 1:
            # cannot be unchanged unless there is only one parent file rev.
            # list() so this also works when values() is a view.
            parent_ie = list(previous_entries.values())[0]
            if self._unchanged(parent_ie):
                mutter("found unchanged entry")
                self.revision = parent_ie.revision
                return "unchanged"
        return self._snapshot_into_revision(revision, previous_entries,
                                            work_tree, commit_builder)

    def _snapshot_into_revision(self, revision, previous_entries, work_tree,
                                commit_builder):
        """Record this revision unconditionally into a store.

        The entry's last-changed revision property (`revision`) is updated to
        that of the new revision.

        :param revision: id of the new revision that is being recorded.

        :returns: This implementation has no return statement, so it
            returns None.
        """
        mutter('new revision {%s} for {%s}', revision, self.file_id)
        self.revision = revision
        self._snapshot_text(previous_entries, work_tree, commit_builder)

    def _snapshot_text(self, file_parents, work_tree, commit_builder):
        """Record the 'text' of this entry, whatever form that takes.

        Must be overridden per kind; the base implementation raises
        NotImplementedError.
        """
        raise NotImplementedError(self._snapshot_text)

    def __eq__(self, other):
        if not isinstance(other, InventoryEntry):
            return NotImplemented

        return ((self.file_id == other.file_id)
                and (self.name == other.name)
                and (other.symlink_target == self.symlink_target)
                and (self.text_sha1 == other.text_sha1)
                and (self.text_size == other.text_size)
                and (self.text_id == other.text_id)
                and (self.parent_id == other.parent_id)
                and (self.kind == other.kind)
                and (self.revision == other.revision)
                and (self.executable == other.executable)
                )

    def __ne__(self, other):
        return not (self == other)

    def __hash__(self):
        # Entries are mutable and compare by value, so hashing is refused.
        raise ValueError('not hashable')

    def _unchanged(self, previous_ie):
        """Return True if this entry is unchanged relative to previous_ie.

        The base check only compares parent_id and name.
        This method should be overridden in child classes.
        """
        compatible = True
        # different inv parent
        if previous_ie.parent_id != self.parent_id:
            compatible = False
        # renamed
        elif previous_ie.name != self.name:
            compatible = False
        return compatible

    def _read_tree_state(self, path, work_tree):
        """Populate fields in the inventory entry from the given tree.

        Note that this should be modified to be a noop on virtual trees
        as all entries created there are prepopulated.
        """
        # TODO: Rather than running this manually, we should check the
        # working sha1 and other expensive properties when they're
        # first requested, or preload them if they're already known
        pass            # nothing to do by default

    def _forget_tree_state(self):
        """Hook for discarding tree state; does nothing by default."""
        pass

499

500

501

class RootEntry(InventoryEntry):
    """Inventory entry of kind 'root_directory'.

    It has an empty name, no parent and a dict of children.
    """

    def _check(self, checker, rev_id, tree):
        """See InventoryEntry._check"""

    def __init__(self, file_id):
        """Create the root entry identified by file_id."""
        # The base-class __init__ is not called; only these six
        # attributes are set.
        self.kind = 'root_directory'
        self.name = u''
        self.file_id = file_id
        self.parent_id = None
        self.revision = None
        self.children = {}

    def __eq__(self, other):
        """Compare by file_id and children; only RootEntry peers qualify."""
        if isinstance(other, RootEntry):
            same_id = (self.file_id == other.file_id)
            return same_id and (self.children == other.children)
        return NotImplemented

520

521

522

class InventoryDirectory(InventoryEntry):

523

"""A directory in an inventory."""

524

525

def _check(self, checker, rev_id, tree):

526

"""See InventoryEntry._check"""

527

if self.text_sha1 != None or self.text_size != None or self.text_id != None:

528

raise BzrCheckError('directory {%s} has text in revision {%s}'

529

% (self.file_id, rev_id))

530

531

def copy(self):

532

other = InventoryDirectory(self.file_id, self.name, self.parent_id)

533

other.revision = self.revision

534

# note that children are *not* copied; they're pulled across when

535

# others are added

536

return other

537

538

def __init__(self, file_id, name, parent_id):

539

super(InventoryDirectory, self).__init__(file_id, name, parent_id)

540

self.children = {}

541

self.kind = 'directory'

542

543

def kind_character(self):

544

"""See InventoryEntry.kind_character."""

545

return '/'

546

547

def _put_in_tar(self, item, tree):

548

"""See InventoryEntry._put_in_tar."""

549

item.type = tarfile.DIRTYPE

550

fileobj = None

551

item.name += '/'

552

item.size = 0

553

item.mode = 0755

554

return fileobj

555

556

def _put_on_disk(self, fullpath, tree):

557

"""See InventoryEntry._put_on_disk."""

558

os.mkdir(fullpath)

559

560

def _snapshot_text(self, file_parents, work_tree, commit_builder):

561

"""See InventoryEntry._snapshot_text."""

562

commit_builder.modified_directory(self.file_id, file_parents)

563

564

565

class InventoryFile(InventoryEntry):

566

"""A file in an inventory."""

567

568

def _check(self, checker, tree_revision_id, tree):

569

"""See InventoryEntry._check"""

570

t = (self.file_id, self.revision)

571

if t in checker.checked_texts:

572

prev_sha = checker.checked_texts[t]

573

if prev_sha != self.text_sha1:

574

raise BzrCheckError('mismatched sha1 on {%s} in {%s}' %

575

(self.file_id, tree_revision_id))

576

else:

577

checker.repeated_text_cnt += 1

578

return

579

580

if self.file_id not in checker.checked_weaves:

581

mutter('check weave {%s}', self.file_id)

582

w = tree.get_weave(self.file_id)

583

# Not passing a progress bar, because it creates a new

584

# progress, which overwrites the current progress,

585

# and doesn't look nice

586

w.check()

587

checker.checked_weaves[self.file_id] = True

588

else:

589

w = tree.get_weave(self.file_id)

590

591

mutter('check version {%s} of {%s}', tree_revision_id, self.file_id)

592

checker.checked_text_cnt += 1

593

# We can't check the length, because Weave doesn't store that

594

# information, and the whole point of looking at the weave's

595

# sha1sum is that we don't have to extract the text.

596

if self.text_sha1 != w.get_sha1(self.revision):

597

raise BzrCheckError('text {%s} version {%s} wrong sha1'

598

% (self.file_id, self.revision))

599

checker.checked_texts[t] = self.text_sha1

600

601

def copy(self):

602

other = InventoryFile(self.file_id, self.name, self.parent_id)

603

other.executable = self.executable

604

other.text_id = self.text_id

605

other.text_sha1 = self.text_sha1

606

other.text_size = self.text_size

607

other.revision = self.revision

608

return other

609

610

def detect_changes(self, old_entry):

611

"""See InventoryEntry.detect_changes."""

612

assert self.text_sha1 != None

613

assert old_entry.text_sha1 != None

614

text_modified = (self.text_sha1 != old_entry.text_sha1)

615

meta_modified = (self.executable != old_entry.executable)

616

return text_modified, meta_modified

617

618

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

619

output_to, reverse=False):

620

"""See InventoryEntry._diff."""

621

try:

622

from_text = tree.get_file(self.file_id).readlines()

623

if to_entry:

624

to_text = to_tree.get_file(to_entry.file_id).readlines()

625

else:

626

to_text = []

627

if not reverse:

628

text_diff(from_label, from_text,

629

to_label, to_text, output_to)

630

else:

631

text_diff(to_label, to_text,

632

from_label, from_text, output_to)

633

except BinaryFile:

634

if reverse:

635

label_pair = (to_label, from_label)

636

else:

637

label_pair = (from_label, to_label)

638

print >> output_to, "Binary files %s and %s differ" % label_pair

639

640

def has_text(self):

641

"""See InventoryEntry.has_text."""

642

return True

643

644

def __init__(self, file_id, name, parent_id):

645

super(InventoryFile, self).__init__(file_id, name, parent_id)

646

self.kind = 'file'

647

648

def kind_character(self):

649

"""See InventoryEntry.kind_character."""

650

return ''

651

652

def _put_in_tar(self, item, tree):

653

"""See InventoryEntry._put_in_tar."""

654

item.type = tarfile.REGTYPE

655

fileobj = tree.get_file(self.file_id)

656

item.size = self.text_size

657

if tree.is_executable(self.file_id):

658

item.mode = 0755

659

else:

660

item.mode = 0644

661

return fileobj

662

663

def _put_on_disk(self, fullpath, tree):

664

"""See InventoryEntry._put_on_disk."""

665

pumpfile(tree.get_file(self.file_id), file(fullpath, 'wb'))

666

if tree.is_executable(self.file_id):

667

os.chmod(fullpath, 0755)

668

669

def _read_tree_state(self, path, work_tree):

670

"""See InventoryEntry._read_tree_state."""

671

self.text_sha1 = work_tree.get_file_sha1(self.file_id, path=path)

672

# FIXME: 20050930 probe for the text size when getting sha1

673

# in _read_tree_state

674

self.executable = work_tree.is_executable(self.file_id, path=path)

675

676

def __repr__(self):

677

return ("%s(%r, %r, parent_id=%r, sha1=%r, len=%s)"

678

% (self.__class__.__name__,

679

self.file_id,

680

self.name,

681

self.parent_id,

682

self.text_sha1,

683

self.text_size))

684

685

def _forget_tree_state(self):

686

self.text_sha1 = None

687

self.executable = None

688

689

def _snapshot_text(self, file_parents, work_tree, commit_builder):

690

"""See InventoryEntry._snapshot_text."""

691

def get_content_byte_lines():

692

return work_tree.get_file(self.file_id).readlines()

693

self.text_sha1, self.text_size = commit_builder.modified_file_text(

694

self.file_id, file_parents, get_content_byte_lines, self.text_sha1, self.text_size)

695

696

def _unchanged(self, previous_ie):

697

"""See InventoryEntry._unchanged."""

698

compatible = super(InventoryFile, self)._unchanged(previous_ie)

699

if self.text_sha1 != previous_ie.text_sha1:

700

compatible = False

701

else:

702

# FIXME: 20050930 probe for the text size when getting sha1

703

# in _read_tree_state

704

self.text_size = previous_ie.text_size

705

if self.executable != previous_ie.executable:

706

compatible = False

707

return compatible

708

709

710

class InventoryLink(InventoryEntry):

711

"""A file in an inventory."""

712

713

__slots__ = ['symlink_target']

714

715

def _check(self, checker, rev_id, tree):

716

"""See InventoryEntry._check"""

717

if self.text_sha1 != None or self.text_size != None or self.text_id != None:

718

raise BzrCheckError('symlink {%s} has text in revision {%s}'

719

% (self.file_id, rev_id))

720

if self.symlink_target is None:

721

raise BzrCheckError('symlink {%s} has no target in revision {%s}'

722

% (self.file_id, rev_id))

723

724

def copy(self):

725

other = InventoryLink(self.file_id, self.name, self.parent_id)

726

other.symlink_target = self.symlink_target

727

other.revision = self.revision

728

return other

729

730

def detect_changes(self, old_entry):

731

"""See InventoryEntry.detect_changes."""

732

# FIXME: which _modified field should we use ? RBC 20051003

733

text_modified = (self.symlink_target != old_entry.symlink_target)

734

if text_modified:

735

mutter(" symlink target changed")

736

meta_modified = False

737

return text_modified, meta_modified

738

739

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

740

output_to, reverse=False):

741

"""See InventoryEntry._diff."""

742

from_text = self.symlink_target

743

if to_entry is not None:

744

to_text = to_entry.symlink_target

745

if reverse:

746

temp = from_text

747

from_text = to_text

748

to_text = temp

749

print >>output_to, '=== target changed %r => %r' % (from_text, to_text)

750

else:

751

if not reverse:

752

print >>output_to, '=== target was %r' % self.symlink_target

753

else:

754

print >>output_to, '=== target is %r' % self.symlink_target

755

756

def __init__(self, file_id, name, parent_id):

757

super(InventoryLink, self).__init__(file_id, name, parent_id)

758

self.kind = 'symlink'

759

760

def kind_character(self):

761

"""See InventoryEntry.kind_character."""

762

return ''

763

764

def _put_in_tar(self, item, tree):

765

"""See InventoryEntry._put_in_tar."""

766

item.type = tarfile.SYMTYPE

767

fileobj = None

768

item.size = 0

769

item.mode = 0755

770

item.linkname = self.symlink_target

771

return fileobj

772

773

def _put_on_disk(self, fullpath, tree):

774

"""See InventoryEntry._put_on_disk."""

775

try:

776

os.symlink(self.symlink_target, fullpath)

777

except OSError,e:

778

raise BzrError("Failed to create symlink %r -> %r, error: %s" % (fullpath, self.symlink_target, e))

779

780

def _read_tree_state(self, path, work_tree):

781

"""See InventoryEntry._read_tree_state."""

782

self.symlink_target = work_tree.get_symlink_target(self.file_id)

783

784

def _forget_tree_state(self):

785

self.symlink_target = None

786

787

def _unchanged(self, previous_ie):

788

"""See InventoryEntry._unchanged."""

789

compatible = super(InventoryLink, self)._unchanged(previous_ie)

790

if self.symlink_target != previous_ie.symlink_target:

791

compatible = False

792

return compatible

793

794

def _snapshot_text(self, file_parents, work_tree, commit_builder):

795

"""See InventoryEntry._snapshot_text."""

796

commit_builder.modified_link(

797

self.file_id, file_parents, self.symlink_target)

798

799

800

class Inventory(object):
    """Inventory of versioned files in a tree.

    This describes which file_id is present at each point in the tree,
    and possibly the SHA-1 or other information about the file.
    Entries can be looked up either by path or by file_id.

    The inventory represents a typical unix file tree, with
    directories containing files and subdirectories.  We never store
    the full path to a file, because renaming a directory implicitly
    moves all of its contents.  This class internally maintains a
    lookup tree that allows the children under a directory to be
    returned quickly.

    InventoryEntry objects must not be modified after they are
    inserted, other than through the Inventory API.

    >>> inv = Inventory()
    >>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))
    InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT', sha1=None, len=None)
    >>> inv['123-123'].name
    'hello.c'

    May be treated as an iterator or set to look up file ids:

    >>> bool(inv.path2id('hello.c'))
    True
    >>> '123-123' in inv
    True

    May also look up by name:

    >>> [x[0] for x in inv.iter_entries()]
    [u'hello.c']
    >>> inv = Inventory('TREE_ROOT-12345678-12345678')
    >>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))
    InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT-12345678-12345678', sha1=None, len=None)
    """
    def __init__(self, root_id=ROOT_ID, revision_id=None):
        """Create an empty inventory.

        The inventory is created containing only a root entry.

        :param root_id: file id given to the RootEntry that is created.
        :param revision_id: stored unchanged as self.revision_id.
        """
        # We are letting Branch.create() create a unique inventory
        # root id. Rather than generating a random one here.
        #if root_id is None:
        #    root_id = bzrlib.branch.gen_file_id('TREE_ROOT')
        self.root = RootEntry(root_id)
        # FIXME: this isn't ever used, changing it to self.revision may break
        # things. TODO make everything use self.revision_id
        self.revision_id = revision_id
        # Map of file_id -> entry for every entry, including the root.
        self._byid = {self.root.file_id: self.root}

    def copy(self):
        """Return a new Inventory holding copies of all non-root entries.

        The new inventory has the same root file id; revision_id is not
        carried over.
        """
        # TODO: jam 20051218 Should copy also copy the revision_id?
        other = Inventory(self.root.file_id)
        # copy recursively so we know directories will be added before
        # their children.  There are more efficient ways than this...
        for path, entry in self.iter_entries():
            if entry == self.root:
                continue
            other.add(entry.copy())
        return other

    def __iter__(self):
        """Iterate over the file ids in this inventory."""
        return iter(self._byid)

    def __len__(self):
        """Returns number of entries."""
        return len(self._byid)

    def iter_entries(self, from_dir=None):
        """Return (path, entry) pairs, in order by name.

        :param from_dir: directory entry, or the file id of one, to start
            from; None means the root.  The starting directory itself is
            not yielded.
        """
        if from_dir is None:
            assert self.root
            from_dir = self.root
        elif isinstance(from_dir, basestring):
            from_dir = self._byid[from_dir]

        # unrolling the recursive called changed the time from
        # 440ms/663ms (inline/total) to 116ms/116ms
        children = from_dir.children.items()
        children.sort()
        children = collections.deque(children)
        stack = [(u'', children)]
        while stack:
            from_dir_relpath, children = stack[-1]

            while children:
                name, ie = children.popleft()

                # we know that from_dir_relpath never ends in a slash
                # and 'f' doesn't begin with one, we can do a string op, rather
                # than the checks of pathjoin(), though this means that all paths
                # start with a slash
                path = from_dir_relpath + '/' + name

                yield path[1:], ie

                if ie.kind != 'directory':
                    continue

                # But do this child first
                new_children = ie.children.items()
                new_children.sort()
                new_children = collections.deque(new_children)
                stack.append((path, new_children))
                # Break out of inner loop, so that we start outer loop with child
                break
            else:
                # if we finished all children, pop it off the stack
                stack.pop()

    def iter_entries_by_dir(self, from_dir=None):
        """Iterate over the entries in a directory first order.

        This returns all entries for a directory before returning
        the entries for children of a directory. This is not
        lexicographically sorted order, and is a hybrid between
        depth-first and breadth-first.

        :return: This yields (path, entry) pairs
        """
        # TODO? Perhaps this should return the from_dir so that the root is
        # yielded? or maybe an option?
        if from_dir is None:
            assert self.root
            from_dir = self.root
        elif isinstance(from_dir, basestring):
            from_dir = self._byid[from_dir]

        stack = [(u'', from_dir)]
        while stack:
            cur_relpath, cur_dir = stack.pop()

            child_dirs = []
            for child_name, child_ie in sorted(cur_dir.children.iteritems()):

                child_relpath = cur_relpath + child_name

                yield child_relpath, child_ie

                if child_ie.kind == 'directory':
                    child_dirs.append((child_relpath+'/', child_ie))
            # Push in reverse so the first subdirectory by name is popped
            # (and therefore visited) first.
            stack.extend(reversed(child_dirs))

    def entries(self):
        """Return list of (path, ie) for all entries except the root.

        This may be faster than iter_entries.
        """
        accum = []
        def descend(dir_ie, dir_path):
            kids = dir_ie.children.items()
            kids.sort()
            for name, ie in kids:
                child_path = pathjoin(dir_path, name)
                accum.append((child_path, ie))
                if ie.kind == 'directory':
                    descend(ie, child_path)

        descend(self.root, u'')
        return accum

    def directories(self):
        """Return (path, entry) pairs for all directories, including the root.
        """
        accum = []
        def descend(parent_ie, parent_path):
            accum.append((parent_path, parent_ie))

            kids = [(ie.name, ie) for ie in parent_ie.children.itervalues() if ie.kind == 'directory']
            kids.sort()

            for name, child_ie in kids:
                child_path = pathjoin(parent_path, name)
                descend(child_ie, child_path)
        descend(self.root, u'')
        return accum

    def __contains__(self, file_id):
        """True if this inventory contains an entry with the given id.

        >>> inv = Inventory()
        >>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))
        InventoryFile('123', 'foo.c', parent_id='TREE_ROOT', sha1=None, len=None)
        >>> '123' in inv
        True
        >>> '456' in inv
        False
        """
        return file_id in self._byid

    def __getitem__(self, file_id):
        """Return the entry for given file_id.

        Raises BzrError if the id is None or is not in the inventory.

        >>> inv = Inventory()
        >>> inv.add(InventoryFile('123123', 'hello.c', ROOT_ID))
        InventoryFile('123123', 'hello.c', parent_id='TREE_ROOT', sha1=None, len=None)
        >>> inv['123123'].name
        'hello.c'
        """
        try:
            return self._byid[file_id]
        except KeyError:
            if file_id is None:
                raise BzrError("can't look up file_id None")
            else:
                raise BzrError("file_id {%s} not in inventory" % file_id)

    def get_file_kind(self, file_id):
        """Return the kind of the entry with the given id.

        Unlike __getitem__, an unknown id raises KeyError here.
        """
        return self._byid[file_id].kind

    def get_child(self, parent_id, filename):
        """Return the child of parent_id named filename, or None."""
        return self[parent_id].children.get(filename)

    def add(self, entry):
        """Add entry to inventory.

        To add a file to a branch ready to be committed, use Branch.add,
        which calls this.

        A parent_id of ROOT_ID or None is rewritten to this inventory's
        root file id.  Raises BzrError if the file id is already present,
        the parent is not in the inventory, or the parent already has a
        child with the same name.

        Returns the new entry object.
        """
        if entry.file_id in self._byid:
            raise BzrError("inventory already contains entry with id {%s}" % entry.file_id)

        if entry.parent_id == ROOT_ID or entry.parent_id is None:
            entry.parent_id = self.root.file_id

        try:
            parent = self._byid[entry.parent_id]
        except KeyError:
            raise BzrError("parent_id {%s} not in inventory" % entry.parent_id)

        if entry.name in parent.children:
            raise BzrError("%s is already versioned" %
                    pathjoin(self.id2path(parent.file_id), entry.name))

        self._byid[entry.file_id] = entry
        parent.children[entry.name] = entry
        return entry

    def add_path(self, relpath, kind, file_id=None, parent_id=None):
        """Add entry from a path.

        The immediate parent must already be versioned.

        An empty path replaces the root (and discards every existing
        entry); otherwise the parent is found from the path, so the
        parent_id argument is not consulted.

        Returns the new entry object."""

        parts = bzrlib.osutils.splitpath(relpath)

        if len(parts) == 0:
            if file_id is None:
                file_id = bzrlib.workingtree.gen_root_id()
            self.root = RootEntry(file_id)
            self._byid = {self.root.file_id: self.root}
            # Honour the documented contract: hand back the new entry.
            return self.root
        else:
            parent_path = parts[:-1]
            parent_id = self.path2id(parent_path)
            if parent_id is None:
                raise NotVersionedError(path=parent_path)
        ie = make_entry(kind, parts[-1], parent_id, file_id)
        return self.add(ie)

    def __delitem__(self, file_id):
        """Remove entry by id.

        >>> inv = Inventory()
        >>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))
        InventoryFile('123', 'foo.c', parent_id='TREE_ROOT', sha1=None, len=None)
        >>> '123' in inv
        True
        >>> del inv['123']
        >>> '123' in inv
        False
        """
        ie = self[file_id]

        assert ie.parent_id is None or \
            self[ie.parent_id].children[ie.name] == ie

        del self._byid[file_id]
        if ie.parent_id is not None:
            del self[ie.parent_id].children[ie.name]

    def __eq__(self, other):
        """Compare two inventories by comparing their contents.

        >>> i1 = Inventory()
        >>> i2 = Inventory()
        >>> i1 == i2
        True
        >>> i1.add(InventoryFile('123', 'foo', ROOT_ID))
        InventoryFile('123', 'foo', parent_id='TREE_ROOT', sha1=None, len=None)
        >>> i1 == i2
        False
        >>> i2.add(InventoryFile('123', 'foo', ROOT_ID))
        InventoryFile('123', 'foo', parent_id='TREE_ROOT', sha1=None, len=None)
        >>> i1 == i2
        True
        """
        if not isinstance(other, Inventory):
            return NotImplemented

        return self._byid == other._byid

    def __ne__(self, other):
        """Return the negation of ``self == other``."""
        # Go through the == operator rather than calling __eq__ directly:
        # __eq__ may return NotImplemented, which is truthy, and negating
        # it would wrongly report "equal" for non-Inventory objects.
        return not (self == other)

    def __hash__(self):
        raise ValueError('not hashable')

    def _iter_file_id_parents(self, file_id):
        """Yield the parents of file_id up to the root.

        The entry for file_id itself is yielded first.  Raises BzrError
        if an id on the way up is not in the inventory.
        """
        while file_id is not None:
            try:
                ie = self._byid[file_id]
            except KeyError:
                raise BzrError("file_id {%s} not found in inventory" % file_id)
            yield ie
            file_id = ie.parent_id

    def get_idpath(self, file_id):
        """Return a list of file_ids for the path to an entry.

        The list contains one element for each directory followed by
        the id of the file itself.  So the length of the returned list
        is equal to the depth of the file in the tree, counting the
        root directory as depth 1.
        """
        # Collect from the entry up to the root, then flip once; this
        # avoids repeatedly inserting at the front of the list.
        p = [parent.file_id for parent in self._iter_file_id_parents(file_id)]
        p.reverse()
        return p

    def id2path(self, file_id):
        """Return as a string the path to file_id.

        >>> i = Inventory()
        >>> e = i.add(InventoryDirectory('src-id', 'src', ROOT_ID))
        >>> e = i.add(InventoryFile('foo-id', 'foo.c', parent_id='src-id'))
        >>> print i.id2path('foo-id')
        src/foo.c
        """
        # get all names, skipping root
        return '/'.join(reversed(
            [parent.name for parent in
             self._iter_file_id_parents(file_id)][:-1]))

    def path2id(self, name):
        """Walk down through directories to return the id of the last component.

        names may be either a list of path components, or a single
        string, in which case it is automatically split.

        This returns the file id of the last component in the path,
        which may be either a file or a directory.

        Returns None IFF the path is not found.
        """
        if isinstance(name, types.StringTypes):
            name = splitpath(name)

        # mutter("lookup path %r" % name)

        parent = self.root
        for f in name:
            try:
                cie = parent.children[f]
                assert cie.name == f
                assert cie.parent_id == parent.file_id
                parent = cie
            except KeyError:
                # or raise an error?
                return None

        return parent.file_id

    def has_filename(self, names):
        """Return True if path2id finds a (truthy) file id for names."""
        return bool(self.path2id(names))

    def has_id(self, file_id):
        """Return True if file_id is in this inventory."""
        return file_id in self._byid

    def rename(self, file_id, new_parent_id, new_name):
        """Move a file within the inventory.

        This can change either the name, or the parent, or both.

        Raises BzrError if new_name is not acceptable, if the new parent
        already has a child called new_name, or if the entry would be
        moved into itself or one of its own subdirectories.

        This does not move the working file."""
        if not is_valid_name(new_name):
            raise BzrError("not an acceptable filename: %r" % new_name)

        new_parent = self._byid[new_parent_id]
        if new_name in new_parent.children:
            raise BzrError("%r already exists in %r" % (new_name, self.id2path(new_parent_id)))

        new_parent_idpath = self.get_idpath(new_parent_id)
        if file_id in new_parent_idpath:
            raise BzrError("cannot move directory %r into a subdirectory of itself, %r"
                    % (self.id2path(file_id), self.id2path(new_parent_id)))

        file_ie = self._byid[file_id]
        old_parent = self._byid[file_ie.parent_id]

        # TODO: Don't leave things messed up if this fails

        del old_parent.children[file_ie.name]
        new_parent.children[new_name] = file_ie

        file_ie.name = new_name
        file_ie.parent_id = new_parent_id

1219

1220

1221

def make_entry(kind, name, parent_id, file_id=None):
    """Build the inventory entry object matching ``kind``.

    :param kind: one of 'directory', 'file' or 'symlink'; anything else
        raises BzrError.
    :param name: the basename of the entry.
    :param parent_id: the parent_id of the entry.
    :param file_id: the file_id to use. if None, one will be created
        from the name.
    """
    # The id is generated before the kind is validated, so an unknown
    # kind with no file_id still goes through id generation first.
    if file_id is None:
        file_id = bzrlib.workingtree.gen_file_id(name)

    entry_classes = (
        ('directory', InventoryDirectory),
        ('file', InventoryFile),
        ('symlink', InventoryLink),
    )
    for known_kind, entry_class in entry_classes:
        if kind == known_kind:
            return entry_class(file_id, name, parent_id)

    raise BzrError("unknown kind %r" % kind)

1239

1240

1241

1242

# Compiled lazily by is_valid_name() on its first call.
_NAME_RE = None


def is_valid_name(name):
    """Return True if name is non-empty and has no '/' or '\\' in it."""
    global _NAME_RE
    pattern = _NAME_RE
    if pattern is None:
        pattern = re.compile(r'^[^/\\]+$')
        _NAME_RE = pattern

    return pattern.match(name) is not None

Older »