/brz/remove-bazaar : revision 1731.1.17

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/inventory.py

Committer: Aaron Bentley
Date: 2006-06-08 10:37:56 UTC
mfrom: (1752 +trunk)
mto: (1907.1.1 no-special-root) (2100.3.5 by-reference-trees) (1731.2.8 nested-trees)
mto: This revision was merged to the branch mainline in revision 1910.
Revision ID: aaron.bentley@utoronto.ca-20060608103756-6a854ecf75030d42

Merge bzr.dev

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/read_bundle.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v07.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/README.1st

doc/configuration.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

foo bar

generate_docs.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/inventory.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# FIXME: This refactoring of the workingtree code doesn't seem to keep

# the WorkingTree's copy of the inventory in sync with the branch. The

# branch modifies its working inventory when it does a commit to make

# missing files permanently removed.

# TODO: Maybe also keep the full path of the entry, and the children?

# But those depend on its position within a particular inventory, and

# it would be nice not to need to hold the backpointer here.

# This should really be an id randomly assigned when the tree is

# created, but it's not for now.

ROOT_ID = "TREE_ROOT"

import collections

import os.path

import re

import sys

import tarfile

import types

import bzrlib

from bzrlib.osutils import (pumpfile, quotefn, splitpath, joinpath,

pathjoin, sha_strings)

from bzrlib.errors import (NotVersionedError, InvalidEntryName,

BzrError, BzrCheckError, BinaryFile)

from bzrlib.trace import mutter

class InventoryEntry(object):
    """Description of a versioned file.

    An InventoryEntry has the following fields, which are also
    present in the XML inventory-entry element:

    file_id

    name
        (within the parent directory)

    parent_id
        file_id of the parent directory, or ROOT_ID

    revision
        the revision_id in which this variation of this file was
        introduced.

    executable
        Indicates that this file should be executable on systems
        that support it.

    text_sha1
        sha-1 of the text of the file

    text_size
        size in bytes of the text of the file

    (reading a version 4 tree created a text_id field.)

    >>> i = Inventory()
    >>> i.path2id('')
    'TREE_ROOT'
    >>> i.add(InventoryDirectory('123', 'src', ROOT_ID))
    InventoryDirectory('123', 'src', parent_id='TREE_ROOT')
    >>> i.add(InventoryFile('2323', 'hello.c', parent_id='123'))
    InventoryFile('2323', 'hello.c', parent_id='123')
    >>> shouldbe = {0: 'src', 1: pathjoin('src','hello.c')}
    >>> for ix, j in enumerate(i.iter_entries()):
    ...     print (j[0] == shouldbe[ix], j[1])
    ...
    (True, InventoryDirectory('123', 'src', parent_id='TREE_ROOT'))
    (True, InventoryFile('2323', 'hello.c', parent_id='123'))
    >>> i.add(InventoryFile('2323', 'bye.c', '123'))
    Traceback (most recent call last):
    ...
    BzrError: inventory already contains entry with id {2323}
    >>> i.add(InventoryFile('2324', 'bye.c', '123'))
    InventoryFile('2324', 'bye.c', parent_id='123')
    >>> i.add(InventoryDirectory('2325', 'wibble', '123'))
    InventoryDirectory('2325', 'wibble', parent_id='123')
    >>> i.path2id('src/wibble')
    '2325'
    >>> '2325' in i
    True
    >>> i.add(InventoryFile('2326', 'wibble.c', '2325'))
    InventoryFile('2326', 'wibble.c', parent_id='2325')
    >>> i['2326']
    InventoryFile('2326', 'wibble.c', parent_id='2325')
    >>> for path, entry in i.iter_entries():
    ...     print path
    ...     assert i.path2id(path)
    ...
    src
    src/bye.c
    src/hello.c
    src/wibble
    src/wibble/wibble.c
    >>> i.id2path('2326')
    'src/wibble/wibble.c'
    """

    # Constants returned by describe_change()
    #
    # TODO: These should probably move to some kind of FileChangeDescription
    # class; that's like what's inside a TreeDelta but we want to be able to
    # generate them just for one file at a time.
    RENAMED = 'renamed'
    MODIFIED_AND_RENAMED = 'modified and renamed'

    # 'symlink_target' is assigned by __init__ and compared by __eq__, so it
    # needs a slot of its own: without it an instance that has no __dict__
    # raises AttributeError as soon as __init__ runs.
    __slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',
                 'text_id', 'parent_id', 'children', 'executable',
                 'revision', 'symlink_target']

129

130

def _add_text_to_weave(self, new_lines, parents, weave_store, transaction):
    """Add new_lines to this entry's versioned file as self.revision.

    The versioned file is obtained from
    weave_store.get_weave_or_empty(self.file_id, transaction); the lines
    are added with the given parents and the versioned file's cache is
    cleared afterwards.
    """
    weave = weave_store.get_weave_or_empty(self.file_id, transaction)
    weave.add_lines(self.revision, parents, new_lines)
    weave.clear_cache()

135

136

def detect_changes(self, old_entry):
    """Return a (text_modified, meta_modified) pair from this to old_entry.

    _read_tree_state must have been called on self and old_entry prior to
    calling detect_changes.

    This base implementation always reports that nothing was modified.
    """
    text_modified = False
    meta_modified = False
    return (text_modified, meta_modified)

143

144

def diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,
         output_to, reverse=False):
    """Perform a diff from this to to_entry.

    text_diff will be used for textual difference calculation.
    This is a template method, override _diff in child classes.

    The tree state of self (and of to_entry, when one is given) is read
    before the work is handed to _diff.
    """
    own_path = tree.id2path(self.file_id)
    self._read_tree_state(own_path, tree)
    if to_entry:
        # cannot diff from one kind to another - you must do a removal
        # and an add if they do not match.
        assert self.kind == to_entry.kind
        other_path = to_tree.id2path(to_entry.file_id)
        to_entry._read_tree_state(other_path, to_tree)
    self._diff(text_diff, from_label, tree, to_label, to_entry, to_tree,
               output_to, reverse)

160

161

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,
          output_to, reverse=False):
    """Perform a diff between two entries of the same kind.

    The base implementation does nothing; diff() calls this hook after
    reading the tree state of the entries involved.
    """
    return None

164

165

def find_previous_heads(self, previous_inventories,
                        versioned_file_store,
                        transaction,
                        entry_vf=None):
    """Return the revisions and entries that directly precede this.

    Returned as a map from revision to inventory entry.

    This is a map containing the file revisions in all parents
    for which the file exists, and its revision is not a parent of
    any other. If the file is new, the set will be empty.

    :param previous_inventories: The inventories that are searched for
        an entry with this entry's file_id.
    :param versioned_file_store: A store where ancestry data on this
        file id can be queried.
    :param transaction: The transaction that queries to the versioned
        file store should be completed under.
    :param entry_vf: The entry versioned file, if it's already available.
    """
    # revision:ie mapping for each ie found in previous_inventories.
    candidates = {}
    # revision:ie mapping with one revision for each head.
    heads = {}
    # revision: ancestor set for each head
    head_ancestors = {}

    # identify candidate head revision ids.
    for inv in previous_inventories:
        if self.file_id not in inv:
            continue
        entry = inv[self.file_id]
        assert entry.file_id == self.file_id
        # remembered for the single-candidate shortcut below
        latest = entry
        if entry.revision not in candidates:
            # add this revision as a candidate.
            candidates[entry.revision] = entry
            continue
        # same revision value in two different inventories:
        # correct possible inconsistencies:
        #     * there was a bug in revision updates with 'x' bit
        #       support.
        known = candidates[entry.revision]
        try:
            if known.executable != entry.executable:
                known.executable = False
                entry.executable = False
        except AttributeError:
            pass
        # must now be the same.
        assert known == entry

    # common case optimisation
    if len(candidates) == 1:
        # if there is only one candidate revision found
        # then we can avoid opening the versioned file to access ancestry:
        # there cannot be any ancestors to eliminate when there is
        # only one revision available.
        heads[latest.revision] = latest
        return heads

    # eliminate ancestors amongst the available candidates:
    # heads are those that are not an ancestor of any other candidate
    # - this provides convergence at a per-file level.
    for entry in candidates.values():
        # may be an ancestor of a known head:
        already_present = False
        for head in heads:
            if entry.revision in head_ancestors[head]:
                already_present = True
                break
        if already_present:
            # an ancestor of an analyzed candidate.
            continue
        # not an ancestor of a known head:
        # load the versioned file for this file id if needed
        if entry_vf is None:
            entry_vf = versioned_file_store.get_weave_or_empty(
                self.file_id, transaction)
        ancestors = set(entry_vf.get_ancestry(entry.revision))
        # may knock something else out:
        for head in list(heads.keys()):
            if head in ancestors:
                # this previously discovered 'head' is not
                # really a head - it's an ancestor of the newly
                # found head,
                heads.pop(head)
        head_ancestors[entry.revision] = ancestors
        heads[entry.revision] = entry
    return heads

250

251

def get_tar_item(self, root, dp, now, tree):
    """Get a tarfile item and a file stream for its content.

    The item is a tarfile.TarInfo named pathjoin(root, dp) whose mtime is
    set to now; the stream is whatever _put_in_tar returns for it.
    """
    tar_info = tarfile.TarInfo(pathjoin(root, dp))
    # TODO: would be cool to actually set it to the timestamp of the
    # revision it was last changed
    tar_info.mtime = now
    content = self._put_in_tar(tar_info, tree)
    return tar_info, content

259

260

def has_text(self):
    """Return true if the object this entry represents has textual data.

    Note that textual data includes binary content.

    Also note that all entries get weave files created for them.
    This attribute is primarily used when upgrading from old trees that
    did not have the weave index for all inventory entries.

    The base implementation answers False.
    """
    answer = False
    return answer

270

271

def __init__(self, file_id, name, parent_id, text_id=None):
    """Create an InventoryEntry

    The filename must be a single component, relative to the
    parent directory; it cannot be a whole path or relative name.

    >>> e = InventoryFile('123', 'hello.c', ROOT_ID)
    >>> e.name
    'hello.c'
    >>> e.file_id
    '123'
    >>> e = InventoryFile('123', 'src/hello.c', ROOT_ID)
    Traceback (most recent call last):
    InvalidEntryName: Invalid entry name: src/hello.c
    """
    assert isinstance(name, basestring), name
    # a name is a single path component, so neither separator may appear
    for separator in ('/', '\\'):
        if separator in name:
            raise InvalidEntryName(name=name)
    # identity as supplied by the caller
    self.file_id = file_id
    self.name = name
    self.parent_id = parent_id
    self.text_id = text_id
    # everything else starts out unset
    self.executable = False
    self.revision = None
    self.text_sha1 = None
    self.text_size = None
    self.symlink_target = None

298

299

def kind_character(self):
    """Return a short kind indicator useful for appending to names.

    The base implementation has no indicator to offer and raises
    BzrError naming self.kind.
    """
    message = 'unknown kind %r' % self.kind
    raise BzrError(message)

302

303

# The three entry kind names; versionable_kind() accepts this same set.
known_kinds = ('file', 'directory', 'symlink')

304

305

def _put_in_tar(self, item, tree):
    """populate item for stashing in a tar, and return the content stream.

    If no content is available, return None.

    The base implementation cannot export anything and raises BzrError
    naming self.file_id and self.kind.
    """
    details = (self.file_id, self.kind)
    raise BzrError("don't know how to export {%s} of kind %r" % details)

312

313

def put_on_disk(self, dest, dp, tree):
    """Create a representation of self on disk in the prefix dest.

    This is a template method - implement _put_on_disk in subclasses.
    The target path is pathjoin(dest, dp); the export is logged through
    mutter once _put_on_disk has returned.
    """
    target = pathjoin(dest, dp)
    self._put_on_disk(target, tree)
    mutter(" export {%s} kind %s to %s", self.file_id, self.kind, target)

322

323

def _put_on_disk(self, fullpath, tree):
    """Put this entry onto disk at fullpath, from tree tree.

    The base implementation cannot export anything and raises BzrError
    naming self.file_id and self.kind.
    """
    details = (self.file_id, self.kind)
    raise BzrError("don't know how to export {%s} of kind %r" % details)

326

327

def sorted_children(self):
    """Return the items of self.children as a sorted list of pairs."""
    return sorted(self.children.items())

331

332

@staticmethod

333

def versionable_kind(kind):

334

return kind in ('file', 'directory', 'symlink')

335

336

def check(self, checker, rev_id, inv, tree):
    """Check this inventory entry is intact.

    This is a template method, override _check for kind specific
    tests.

    :param checker: Check object providing context for the checks;
         can be used to find out what parts of the repository have already
         been checked.
    :param rev_id: Revision id from which this InventoryEntry was loaded.
         Not necessarily the last-changed revision for this file.
    :param inv: Inventory from which the entry was loaded.
    :param tree: RevisionTree for this entry.
    :raises BzrCheckError: if this entry names a parent_id that inv does
         not contain.
    """
    # Identity test: None is the "no parent" marker, and comparing with
    # != would defer to whatever __ne__ the id object happens to define.
    if self.parent_id is not None and not inv.has_id(self.parent_id):
        raise BzrCheckError('missing parent {%s} in inventory for revision {%s}'
                            % (self.parent_id, rev_id))
    self._check(checker, rev_id, tree)

355

356

def _check(self, checker, rev_id, tree):
    """Check this inventory entry for kind specific errors.

    The base implementation knows no kind and raises BzrCheckError naming
    self.kind and rev_id.
    """
    details = (self.kind, rev_id)
    raise BzrCheckError('unknown entry kind %r in revision {%s}' % details)

360

361

def copy(self):
    """Clone this inventory entry.

    Not provided by the base class: raises NotImplementedError.
    """
    raise NotImplementedError()

364

365

@staticmethod

366

def describe_change(old_entry, new_entry):

367

"""Describe the change between old_entry and this.

368

369

This smells of being an InterInventoryEntry situation, but as its

370

the first one, we're making it a static method for now.

371

372

An entry with a different parent, or different name is considered

373

to be renamed. Reparenting is an internal detail.

374

Note that renaming the parent does not trigger a rename for the

375

child entry itself.

376

"""

377

# TODO: Perhaps return an object rather than just a string

378

if old_entry is new_entry:

379

# also the case of both being None

380

return 'unchanged'

381

elif old_entry is None:

382

return 'added'

383

elif new_entry is None:

384

return 'removed'

385

text_modified, meta_modified = new_entry.detect_changes(old_entry)

386

if text_modified or meta_modified:

387

modified = True

388

else:

389

modified = False

390

# TODO 20060511 (mbp, rbc) factor out 'detect_rename' here.

391

if old_entry.parent_id != new_entry.parent_id:

392

renamed = True

393

elif old_entry.name != new_entry.name:

394

renamed = True

395

else:

396

renamed = False

397

if renamed and not modified:

398

return InventoryEntry.RENAMED

399

if modified and not renamed:

400

return 'modified'

401

if modified and renamed:

402

return InventoryEntry.MODIFIED_AND_RENAMED

403

return 'unchanged'

404

405

def __repr__(self):
    """Return 'ClassName(file_id, name, parent_id=...)' for this entry."""
    fields = (self.__class__.__name__,
              self.file_id,
              self.name,
              self.parent_id)
    return "%s(%r, %r, parent_id=%r)" % fields

411

412

def snapshot(self, revision, path, previous_entries,
             work_tree, weave_store, transaction):
    """Make a snapshot of this entry which may or may not have changed.

    This means that all its fields are populated, that it has its
    text stored in the text store or weave.

    :returns: "unchanged" when there is exactly one previous entry and
        _unchanged() accepts it; otherwise whatever
        _snapshot_into_revision returns.
    """
    mutter('new parents of %s are %r', path, previous_entries)
    self._read_tree_state(path, work_tree)
    # cannot be unchanged unless there is only one parent file rev.
    if len(previous_entries) == 1:
        (parent_ie,) = previous_entries.values()
        if self._unchanged(parent_ie):
            mutter("found unchanged entry")
            self.revision = parent_ie.revision
            return "unchanged"
    return self._snapshot_into_revision(revision, previous_entries,
                                        work_tree, weave_store, transaction)

430

431

def _snapshot_into_revision(self, revision, previous_entries, work_tree,
                            weave_store, transaction):
    """Record this revision unconditionally into a store.

    The entry's last-changed revision property (`revision`) is updated to
    that of the new revision, and the text is then recorded through
    _snapshot_text.

    :param revision: id of the new revision that is being recorded.

    :returns: None.  NOTE(review): this docstring used to promise a string
        description of the commit (e.g. "merged", "modified"), but no
        value is returned here - confirm what callers expect.
    """
    mutter('new revision {%s} for {%s}', revision, self.file_id)
    self.revision = revision
    self._snapshot_text(previous_entries, work_tree, weave_store,
                        transaction)

446

447

def _snapshot_text(self, file_parents, work_tree, weave_store, transaction):
    """Record the 'text' of this entry, whatever form that takes.

    This default implementation simply adds an empty text, with the keys
    of file_parents as its parents.
    """
    mutter('storing file {%s} in revision {%s}',
           self.file_id, self.revision)
    parent_revisions = file_parents.keys()
    self._add_text_to_weave([], parent_revisions, weave_store, transaction)

455

456

def __eq__(self, other):
    """Compare two entries field by field.

    Returns NotImplemented when other is not an InventoryEntry; otherwise
    True only if every compared field is equal.
    """
    if not isinstance(other, InventoryEntry):
        return NotImplemented

    # Checked in this order, stopping at the first field that differs.
    compared = ('file_id', 'name', 'symlink_target', 'text_sha1',
                'text_size', 'text_id', 'parent_id', 'kind', 'revision',
                'executable')
    for field in compared:
        if not (getattr(self, field) == getattr(other, field)):
            return False
    return True

471

472

def __ne__(self, other):
    """Return the negation of self == other."""
    are_equal = (self == other)
    return not are_equal

474

475

def __hash__(self):
    """Refuse to hash: always raises ValueError('not hashable')."""
    reason = 'not hashable'
    raise ValueError(reason)

477

478

def _unchanged(self, previous_ie):
    """Return True if this entry is unchanged relative to previous_ie.

    The base check compares only parent_id and name.
    This method should be overridden in child classes.
    """
    # different inv parent
    if previous_ie.parent_id != self.parent_id:
        return False
    # renamed
    if previous_ie.name != self.name:
        return False
    return True

491

492

def _read_tree_state(self, path, work_tree):
    """Populate fields in the inventory entry from the given tree.

    Note that this should be modified to be a noop on virtual trees
    as all entries created there are prepopulated.

    The base implementation has nothing to read and does nothing.
    """
    # TODO: Rather than running this manually, we should check the
    # working sha1 and other expensive properties when they're
    # first requested, or preload them if they're already known
    return None

502

503

def _forget_tree_state(self):
    """Do nothing; the base class provides this hook as a no-op."""
    return None

505

506

507

class InventoryDirectory(InventoryEntry):
    """A directory in an inventory."""

    def _check(self, checker, rev_id, tree):
        """See InventoryEntry._check

        :raises BzrCheckError: if any of text_sha1, text_size or text_id
            is set, since a directory carries no text.
        """
        # Identity tests: None is the "unset" marker for these fields.
        if (self.text_sha1 is not None
                or self.text_size is not None
                or self.text_id is not None):
            raise BzrCheckError('directory {%s} has text in revision {%s}'
                                % (self.file_id, rev_id))

    def copy(self):
        """Return a new InventoryDirectory with the same ids, name and
        revision as this one."""
        other = InventoryDirectory(self.file_id, self.name, self.parent_id)
        other.revision = self.revision
        # note that children are *not* copied; they're pulled across when
        # others are added
        return other

    def __init__(self, file_id, name, parent_id):
        """Create a directory entry with no children and kind 'directory'."""
        super(InventoryDirectory, self).__init__(file_id, name, parent_id)
        self.children = {}
        self.kind = 'directory'

    def kind_character(self):
        """See InventoryEntry.kind_character."""
        return '/'

    def _put_in_tar(self, item, tree):
        """See InventoryEntry._put_in_tar.

        Marks item as a directory member; there is no content stream, so
        None is returned.
        """
        item.type = tarfile.DIRTYPE
        item.name += '/'
        item.size = 0
        # octal 755 (rwxr-xr-x), spelled via int() so the value parses on
        # interpreters that reject the legacy 0755 literal as well
        item.mode = int('755', 8)
        return None

    def _put_on_disk(self, fullpath, tree):
        """See InventoryEntry._put_on_disk."""
        os.mkdir(fullpath)

544

545

546

class InventoryFile(InventoryEntry):

547

"""A file in an inventory."""

548

549

def _check(self, checker, tree_revision_id, tree):

550

"""See InventoryEntry._check"""

551

t = (self.file_id, self.revision)

552

if t in checker.checked_texts:

553

prev_sha = checker.checked_texts[t]

554

if prev_sha != self.text_sha1:

555

raise BzrCheckError('mismatched sha1 on {%s} in {%s}' %

556

(self.file_id, tree_revision_id))

557

else:

558

checker.repeated_text_cnt += 1

559

return

560

561

if self.file_id not in checker.checked_weaves:

562

mutter('check weave {%s}', self.file_id)

563

w = tree.get_weave(self.file_id)

564

# Not passing a progress bar, because it creates a new

565

# progress, which overwrites the current progress,

566

# and doesn't look nice

567

w.check()

568

checker.checked_weaves[self.file_id] = True

569

else:

570

w = tree.get_weave(self.file_id)

571

572

mutter('check version {%s} of {%s}', tree_revision_id, self.file_id)

573

checker.checked_text_cnt += 1

574

# We can't check the length, because Weave doesn't store that

575

# information, and the whole point of looking at the weave's

576

# sha1sum is that we don't have to extract the text.

577

if self.text_sha1 != w.get_sha1(self.revision):

578

raise BzrCheckError('text {%s} version {%s} wrong sha1'

579

% (self.file_id, self.revision))

580

checker.checked_texts[t] = self.text_sha1

581

582

def copy(self):

583

other = InventoryFile(self.file_id, self.name, self.parent_id)

584

other.executable = self.executable

585

other.text_id = self.text_id

586

other.text_sha1 = self.text_sha1

587

other.text_size = self.text_size

588

other.revision = self.revision

589

return other

590

591

def detect_changes(self, old_entry):

592

"""See InventoryEntry.detect_changes."""

593

assert self.text_sha1 != None

594

assert old_entry.text_sha1 != None

595

text_modified = (self.text_sha1 != old_entry.text_sha1)

596

meta_modified = (self.executable != old_entry.executable)

597

return text_modified, meta_modified

598

599

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

600

output_to, reverse=False):

601

"""See InventoryEntry._diff."""

602

try:

603

from_text = tree.get_file(self.file_id).readlines()

604

if to_entry:

605

to_text = to_tree.get_file(to_entry.file_id).readlines()

606

else:

607

to_text = []

608

if not reverse:

609

text_diff(from_label, from_text,

610

to_label, to_text, output_to)

611

else:

612

text_diff(to_label, to_text,

613

from_label, from_text, output_to)

614

except BinaryFile:

615

if reverse:

616

label_pair = (to_label, from_label)

617

else:

618

label_pair = (from_label, to_label)

619

print >> output_to, "Binary files %s and %s differ" % label_pair

620

621

def has_text(self):

622

"""See InventoryEntry.has_text."""

623

return True

624

625

def __init__(self, file_id, name, parent_id):

626

super(InventoryFile, self).__init__(file_id, name, parent_id)

627

self.kind = 'file'

628

629

def kind_character(self):

630

"""See InventoryEntry.kind_character."""

631

return ''

632

633

def _put_in_tar(self, item, tree):

634

"""See InventoryEntry._put_in_tar."""

635

item.type = tarfile.REGTYPE

636

fileobj = tree.get_file(self.file_id)

637

item.size = self.text_size

638

if tree.is_executable(self.file_id):

639

item.mode = 0755

640

else:

641

item.mode = 0644

642

return fileobj

643

644

def _put_on_disk(self, fullpath, tree):

645

"""See InventoryEntry._put_on_disk."""

646

pumpfile(tree.get_file(self.file_id), file(fullpath, 'wb'))

647

if tree.is_executable(self.file_id):

648

os.chmod(fullpath, 0755)

649

650

def _read_tree_state(self, path, work_tree):

651

"""See InventoryEntry._read_tree_state."""

652

self.text_sha1 = work_tree.get_file_sha1(self.file_id, path=path)

653

self.executable = work_tree.is_executable(self.file_id, path=path)

654

655

def _forget_tree_state(self):

656

self.text_sha1 = None

657

self.executable = None

658

659

def _snapshot_text(self, file_parents, work_tree, versionedfile_store, transaction):

660

"""See InventoryEntry._snapshot_text."""

661

mutter('storing text of file {%s} in revision {%s} into %r',

662

self.file_id, self.revision, versionedfile_store)

663

# special case to avoid diffing on renames or

664

# reparenting

665

if (len(file_parents) == 1

666

and self.text_sha1 == file_parents.values()[0].text_sha1

667

and self.text_size == file_parents.values()[0].text_size):

668

previous_ie = file_parents.values()[0]

669

versionedfile = versionedfile_store.get_weave(self.file_id, transaction)

670

versionedfile.clone_text(self.revision, previous_ie.revision, file_parents.keys())

671

else:

672

new_lines = work_tree.get_file(self.file_id).readlines()

673

self._add_text_to_weave(new_lines, file_parents.keys(), versionedfile_store,

674

transaction)

675

self.text_sha1 = sha_strings(new_lines)

676

self.text_size = sum(map(len, new_lines))

677

678

679

def _unchanged(self, previous_ie):

680

"""See InventoryEntry._unchanged."""

681

compatible = super(InventoryFile, self)._unchanged(previous_ie)

682

if self.text_sha1 != previous_ie.text_sha1:

683

compatible = False

684

else:

685

# FIXME: 20050930 probe for the text size when getting sha1

686

# in _read_tree_state

687

self.text_size = previous_ie.text_size

688

if self.executable != previous_ie.executable:

689

compatible = False

690

return compatible

691

692

693

class InventoryLink(InventoryEntry):

694

"""A file in an inventory."""

695

696

__slots__ = ['symlink_target']

697

698

def _check(self, checker, rev_id, tree):

699

"""See InventoryEntry._check"""

700

if self.text_sha1 != None or self.text_size != None or self.text_id != None:

701

raise BzrCheckError('symlink {%s} has text in revision {%s}'

702

% (self.file_id, rev_id))

703

if self.symlink_target == None:

704

raise BzrCheckError('symlink {%s} has no target in revision {%s}'

705

% (self.file_id, rev_id))

706

707

def copy(self):

708

other = InventoryLink(self.file_id, self.name, self.parent_id)

709

other.symlink_target = self.symlink_target

710

other.revision = self.revision

711

return other

712

713

def detect_changes(self, old_entry):

714

"""See InventoryEntry.detect_changes."""

715

# FIXME: which _modified field should we use ? RBC 20051003

716

text_modified = (self.symlink_target != old_entry.symlink_target)

717

if text_modified:

718

mutter(" symlink target changed")

719

meta_modified = False

720

return text_modified, meta_modified

721

722

def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,

723

output_to, reverse=False):

724

"""See InventoryEntry._diff."""

725

from_text = self.symlink_target

726

if to_entry is not None:

727

to_text = to_entry.symlink_target

728

if reverse:

729

temp = from_text

730

from_text = to_text

731

to_text = temp

732

print >>output_to, '=== target changed %r => %r' % (from_text, to_text)

733

else:

734

if not reverse:

735

print >>output_to, '=== target was %r' % self.symlink_target

736

else:

737

print >>output_to, '=== target is %r' % self.symlink_target

738

739

def __init__(self, file_id, name, parent_id):

740

super(InventoryLink, self).__init__(file_id, name, parent_id)

741

self.kind = 'symlink'

742

743

def kind_character(self):

744

"""See InventoryEntry.kind_character."""

745

return ''

746

747

def _put_in_tar(self, item, tree):

748

"""See InventoryEntry._put_in_tar."""

749

item.type = tarfile.SYMTYPE

750

fileobj = None

751

item.size = 0

752

item.mode = 0755

753

item.linkname = self.symlink_target

754

return fileobj

755

756

def _put_on_disk(self, fullpath, tree):

757

"""See InventoryEntry._put_on_disk."""

758

try:

759

os.symlink(self.symlink_target, fullpath)

760

except OSError,e:

761

raise BzrError("Failed to create symlink %r -> %r, error: %s" % (fullpath, self.symlink_target, e))

762

763

def _read_tree_state(self, path, work_tree):

764

"""See InventoryEntry._read_tree_state."""

765

self.symlink_target = work_tree.get_symlink_target(self.file_id)

766

767

def _forget_tree_state(self):

768

self.symlink_target = None

769

770

def _unchanged(self, previous_ie):

771

"""See InventoryEntry._unchanged."""

772

compatible = super(InventoryLink, self)._unchanged(previous_ie)

773

if self.symlink_target != previous_ie.symlink_target:

774

compatible = False

775

return compatible

776

777

778

class Inventory(object):
    """Inventory of versioned files in a tree.

    This describes which file_id is present at each point in the tree,
    and possibly the SHA-1 or other information about the file.
    Entries can be looked up either by path or by file_id.

    The inventory represents a typical unix file tree, with
    directories containing files and subdirectories. We never store
    the full path to a file, because renaming a directory implicitly
    moves all of its contents. This class internally maintains a
    lookup tree that allows the children under a directory to be
    returned quickly.

    InventoryEntry objects must not be modified after they are
    inserted, other than through the Inventory API.

    >>> inv = Inventory()
    >>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))
    InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT')
    >>> inv['123-123'].name
    'hello.c'

    May be treated as an iterator or set to look up file ids:

    >>> bool(inv.path2id('hello.c'))
    True
    >>> '123-123' in inv
    True

    May also look up by name:

    >>> [x[0] for x in inv.iter_entries()]
    [u'hello.c']
    >>> inv = Inventory('TREE_ROOT-12345678-12345678')
    >>> inv.add(InventoryFile('123-123', 'hello.c', ROOT_ID))
    InventoryFile('123-123', 'hello.c', parent_id='TREE_ROOT-12345678-12345678')
    """

    def __init__(self, root_id=ROOT_ID, revision_id=None):
        """Create an inventory that is empty apart from its root.

        :param root_id: file id for the root directory entry.  If None, no
            root entry is created and the inventory starts out completely
            empty, with self.root set to None.
        :param revision_id: stored unchanged as self.revision_id.
        """
        if root_id is not None:
            self.root = InventoryDirectory(root_id, '', None)
            self._byid = {self.root.file_id: self.root}
        else:
            self.root = None
            self._byid = {}
        self.revision_id = revision_id

    def copy(self):
        """Return a new Inventory holding copies of all entries.

        The revision_id is not carried over to the copy.
        """
        # TODO: jam 20051218 Should copy also copy the revision_id?
        if self.root is None:
            # A rootless inventory has nothing to copy.
            return Inventory(None)
        other = Inventory(self.root.file_id)
        # copy recursively so we know directories will be added before
        # their children. There are more efficient ways than this...
        for path, entry in self.iter_entries():
            if entry == self.root:
                continue
            other.add(entry.copy())
        return other

    def __iter__(self):
        """Iterate over the file ids in this inventory."""
        return iter(self._byid)

    def __len__(self):
        """Returns number of entries."""
        return len(self._byid)

    def iter_entries(self, from_dir=None):
        """Return (path, entry) pairs, in order by name.

        :param from_dir: where to start: None for the root, a file id
            string, or a directory entry.  The starting directory itself is
            not yielded, and paths are relative to it.

        Each directory is yielded before its children, and its children
        before its later siblings.  Nothing is yielded for an inventory
        without a root.
        """
        if from_dir is None:
            if self.root is None:
                return
            from_dir = self.root
        elif isinstance(from_dir, basestring):
            from_dir = self._byid[from_dir]

        # unrolling the recursive called changed the time from
        # 440ms/663ms (inline/total) to 116ms/116ms
        children = from_dir.children.items()
        children.sort()
        children = collections.deque(children)
        stack = [(u'', children)]
        while stack:
            from_dir_relpath, children = stack[-1]

            while children:
                name, ie = children.popleft()

                # we know that from_dir_relpath never ends in a slash
                # and 'f' doesn't begin with one, we can do a string op, rather
                # than the checks of pathjoin(), though this means that all paths
                # start with a slash
                path = from_dir_relpath + '/' + name

                yield path[1:], ie

                if ie.kind != 'directory':
                    continue

                # But do this child first
                new_children = ie.children.items()
                new_children.sort()
                new_children = collections.deque(new_children)
                stack.append((path, new_children))
                # Break out of inner loop, so that we start outer loop with child
                break
            else:
                # if we finished all children, pop it off the stack
                stack.pop()

    def entries(self):
        """Return list of (path, ie) for all entries except the root.

        This may be faster than iter_entries.
        """
        accum = []
        if self.root is None:
            # Nothing to walk; agree with iter_entries instead of failing.
            return accum

        def descend(dir_ie, dir_path):
            kids = dir_ie.children.items()
            kids.sort()
            for name, ie in kids:
                child_path = pathjoin(dir_path, name)
                accum.append((child_path, ie))
                if ie.kind == 'directory':
                    descend(ie, child_path)

        descend(self.root, u'')
        return accum

    def directories(self):
        """Return (path, entry) pairs for all directories, including the root.
        """
        accum = []
        if self.root is None:
            # No root means no directories at all.
            return accum

        def descend(parent_ie, parent_path):
            accum.append((parent_path, parent_ie))

            kids = [(ie.name, ie) for ie in parent_ie.children.itervalues() if ie.kind == 'directory']
            kids.sort()

            for name, child_ie in kids:
                child_path = pathjoin(parent_path, name)
                descend(child_ie, child_path)

        descend(self.root, u'')
        return accum

    def __contains__(self, file_id):
        """True if this entry contains a file with given id.

        >>> inv = Inventory()
        >>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))
        InventoryFile('123', 'foo.c', parent_id='TREE_ROOT')
        >>> '123' in inv
        True
        >>> '456' in inv
        False
        """
        return file_id in self._byid

    def __getitem__(self, file_id):
        """Return the entry for given file_id.

        :raises BzrError: if file_id is not present.

        >>> inv = Inventory()
        >>> inv.add(InventoryFile('123123', 'hello.c', ROOT_ID))
        InventoryFile('123123', 'hello.c', parent_id='TREE_ROOT')
        >>> inv['123123'].name
        'hello.c'
        """
        try:
            return self._byid[file_id]
        except KeyError:
            if file_id is None:
                raise BzrError("can't look up file_id None")
            else:
                raise BzrError("file_id {%s} not in inventory" % file_id)

    def get_file_kind(self, file_id):
        """Return the kind of the entry with the given file_id.

        Unlike __getitem__, a missing id raises KeyError.
        """
        return self._byid[file_id].kind

    def get_child(self, parent_id, filename):
        """Return the child of parent_id named filename, or None if absent."""
        return self[parent_id].children.get(filename)

    def add(self, entry):
        """Add entry to inventory.

        To add a file to a branch ready to be committed, use Branch.add,
        which calls this.

        A parent_id of ROOT_ID or None is rewritten to this inventory's
        actual root id.

        :raises BzrError: if the file id is already present, the parent is
            not in the inventory, or the parent already has a child with
            the same name.

        Returns the new entry object.
        """
        if entry.file_id in self._byid:
            raise BzrError("inventory already contains entry with id {%s}" % entry.file_id)

        if entry.parent_id == ROOT_ID or entry.parent_id is None:
            entry.parent_id = self.root.file_id

        try:
            parent = self._byid[entry.parent_id]
        except KeyError:
            raise BzrError("parent_id {%s} not in inventory" % entry.parent_id)

        if entry.name in parent.children:
            raise BzrError("%s is already versioned" %
                           pathjoin(self.id2path(parent.file_id), entry.name))

        self._byid[entry.file_id] = entry
        parent.children[entry.name] = entry
        return entry

    def add_path(self, relpath, kind, file_id=None, parent_id=None):
        """Add entry from a path.

        The immediate parent must already be versioned.

        An empty relpath (re)creates the root directory: every existing
        entry is discarded and the new root entry is returned.

        :param parent_id: accepted for compatibility; the parent is always
            looked up from relpath.
        :raises NotVersionedError: if the parent directory is not versioned.

        Returns the new entry object."""

        parts = bzrlib.osutils.splitpath(relpath)

        if len(parts) == 0:
            if file_id is None:
                file_id = bzrlib.workingtree.gen_root_id()
            self.root = InventoryDirectory(file_id, '', None)
            self._byid = {self.root.file_id: self.root}
            # Honour the documented contract; this used to return None.
            return self.root
        else:
            parent_path = parts[:-1]
            parent_id = self.path2id(parent_path)
            if parent_id is None:
                raise NotVersionedError(path=parent_path)
        ie = make_entry(kind, parts[-1], parent_id, file_id)
        return self.add(ie)

    def __delitem__(self, file_id):
        """Remove entry by id.

        >>> inv = Inventory()
        >>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))
        InventoryFile('123', 'foo.c', parent_id='TREE_ROOT')
        >>> '123' in inv
        True
        >>> del inv['123']
        >>> '123' in inv
        False
        """
        ie = self[file_id]

        assert ie.parent_id is None or \
            self[ie.parent_id].children[ie.name] == ie

        del self._byid[file_id]
        if ie.parent_id is not None:
            del self[ie.parent_id].children[ie.name]

    def __eq__(self, other):
        """Compare two sets by comparing their contents.

        >>> i1 = Inventory()
        >>> i2 = Inventory()
        >>> i1 == i2
        True
        >>> i1.add(InventoryFile('123', 'foo', ROOT_ID))
        InventoryFile('123', 'foo', parent_id='TREE_ROOT')
        >>> i1 == i2
        False
        >>> i2.add(InventoryFile('123', 'foo', ROOT_ID))
        InventoryFile('123', 'foo', parent_id='TREE_ROOT')
        >>> i1 == i2
        True
        """
        if not isinstance(other, Inventory):
            return NotImplemented

        if len(self._byid) != len(other._byid):
            # shortcut: obviously not the same
            return False

        return self._byid == other._byid

    def __ne__(self, other):
        """Return the negation of ``self == other``."""
        # Go through the == operator rather than calling __eq__ directly:
        # __eq__ returns NotImplemented for foreign types, and negating
        # that truthy value would wrongly report "not different".
        return not (self == other)

    def __hash__(self):
        """Inventories are mutable and refuse to be hashed."""
        raise ValueError('not hashable')

    def _iter_file_id_parents(self, file_id):
        """Yield the parents of file_id up to the root.

        The entry for file_id itself is yielded first, the root last.

        :raises BzrError: if an id on the way up is not in the inventory.
        """
        while file_id is not None:
            try:
                ie = self._byid[file_id]
            except KeyError:
                raise BzrError("file_id {%s} not found in inventory" % file_id)
            yield ie
            file_id = ie.parent_id

    def get_idpath(self, file_id):
        """Return a list of file_ids for the path to an entry.

        The list contains one element for each directory followed by
        the id of the file itself. So the length of the returned list
        is equal to the depth of the file in the tree, counting the
        root directory as depth 1.
        """
        # Collected leaf-first, then flipped once so the root comes first.
        p = [parent.file_id for parent in self._iter_file_id_parents(file_id)]
        p.reverse()
        return p

    def id2path(self, file_id):
        """Return as a string the path to file_id.

        >>> i = Inventory()
        >>> e = i.add(InventoryDirectory('src-id', 'src', ROOT_ID))
        >>> e = i.add(InventoryFile('foo-id', 'foo.c', parent_id='src-id'))
        >>> print i.id2path('foo-id')
        src/foo.c
        """
        # get all names, skipping root
        return '/'.join(reversed(
            [parent.name for parent in
             self._iter_file_id_parents(file_id)][:-1]))

    def path2id(self, name):
        """Walk down through directories to return the id of the last component.

        names may be either a list of path components, or a single
        string, in which case it is automatically split.

        This returns the file id of the last component in the path,
        which may be either a file or a directory.  An empty path gives
        the id of the root.

        Returns None IFF the path is not found.
        """
        if isinstance(name, types.StringTypes):
            name = splitpath(name)

        # mutter("lookup path %r" % name)

        parent = self.root
        if parent is None:
            return None
        for f in name:
            try:
                cie = parent.children[f]
                assert cie.name == f
                assert cie.parent_id == parent.file_id
                parent = cie
            except KeyError:
                # or raise an error?
                return None

        return parent.file_id

    def has_filename(self, names):
        """Return True if path2id finds a (truthy) file id for names."""
        return bool(self.path2id(names))

    def has_id(self, file_id):
        """Return True if file_id is present in this inventory."""
        return file_id in self._byid

    def rename(self, file_id, new_parent_id, new_name):
        """Move a file within the inventory.

        This can change either the name, or the parent, or both.

        :raises BzrError: if new_name is not a valid name, already exists
            in the new parent, or the move would put a directory inside
            itself.

        This does not move the working file."""
        if not is_valid_name(new_name):
            raise BzrError("not an acceptable filename: %r" % new_name)

        new_parent = self._byid[new_parent_id]
        if new_name in new_parent.children:
            raise BzrError("%r already exists in %r" % (new_name, self.id2path(new_parent_id)))

        new_parent_idpath = self.get_idpath(new_parent_id)
        if file_id in new_parent_idpath:
            raise BzrError("cannot move directory %r into a subdirectory of itself, %r"
                           % (self.id2path(file_id), self.id2path(new_parent_id)))

        file_ie = self._byid[file_id]
        old_parent = self._byid[file_ie.parent_id]

        # TODO: Don't leave things messed up if this fails

        del old_parent.children[file_ie.name]
        new_parent.children[new_name] = file_ie

        file_ie.name = new_name
        file_ie.parent_id = new_parent_id

    def is_root(self, file_id):
        """Return True if file_id is the id of this inventory's root entry."""
        return self.root is not None and file_id == self.root.file_id

1189

1190

1191

def make_entry(kind, name, parent_id, file_id=None):
    """Create an inventory entry.

    :param kind: the type of inventory entry to create: 'directory',
        'file' or 'symlink'.
    :param name: the basename of the entry.
    :param parent_id: the parent_id of the entry.
    :param file_id: the file_id to use. if None, one will be created.
    :raises BzrError: if kind is not one of the known kinds.
    """
    if file_id is None:
        file_id = bzrlib.workingtree.gen_file_id(name)
    known_kinds = (
        ('directory', InventoryDirectory),
        ('file', InventoryFile),
        ('symlink', InventoryLink),
    )
    for known_kind, entry_class in known_kinds:
        if kind == known_kind:
            return entry_class(file_id, name, parent_id)
    raise BzrError("unknown kind %r" % kind)

1209

1210

1211

1212

# Compiled on first use by is_valid_name().
_NAME_RE = None


def is_valid_name(name):
    """Return True if name is non-empty and has no '/' or backslash in it."""
    global _NAME_RE
    if _NAME_RE is None:
        # Compile lazily so importing the module stays cheap.
        _NAME_RE = re.compile(r'^[^/\\]+$')
    found = _NAME_RE.match(name)
    return found is not None

Older »