/brz/remove-bazaar : revision 753

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/inventory.py

Committer: Martin Pool
Date: 2005-06-22 08:12:31 UTC
Revision ID: mbp@sourcefrog.net-20050622081231-630e514240ccb87a

- new exception NotVersionedError
- raise this from Inventory.add_path if parent isn't versioned

files added:
.bzrignore

.rsyncexclude

NEWS

README

TODO

build-api

bzr-man.py

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/help.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge_core.py

bzrlib/newinventory.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/revision.py

bzrlib/selftest

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/statcache.py

bzrlib/status.py

bzrlib/store.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/upgrade.py

bzrlib/workingtree.py

bzrlib/xml.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/fortune

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

elementtree

elementtree/ElementTree.py

elementtree/__init__.py

notes

notes/new-inventory-sample.xml

notes/performance.txt

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

setup.py

testbzr

urlgrabber

urlgrabber/__init__.py

urlgrabber/byterange.py

urlgrabber/grabber.py

urlgrabber/keepalive.py

urlgrabber/mirror.py

urlgrabber/progress.py

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/inventory.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# File id used for the root directory entry of every Inventory created
# by this module (see Inventory.__init__).
#
# This should really be an id randomly assigned when the tree is
# created, but it's not for now.
ROOT_ID = "TREE_ROOT"

import sys, os.path, types, re

try:

from cElementTree import Element, ElementTree, SubElement

except ImportError:

from elementtree.ElementTree import Element, ElementTree, SubElement

from bzrlib.xml import XMLMixin

from bzrlib.errors import BzrError, BzrCheckError

import bzrlib

from bzrlib.osutils import uuid, quotefn, splitpath, joinpath, appendpath

from bzrlib.trace import mutter

class InventoryEntry(XMLMixin):
    """Description of a versioned file.

    An InventoryEntry has the following fields, which are also
    present in the XML inventory-entry element:

    * *file_id*
    * *name*: (only the basename within the directory, must not
      contain slashes)
    * *kind*: "directory" or "file"
    * *parent_id*: file_id of the containing directory (left out of
      the XML form when the parent is the tree root)
    * *text_sha1*: only for files
    * *text_size*: in bytes, only for files
    * *text_id*: identifier for the text version, only for files

    InventoryEntries can also exist inside a WorkingTree
    inventory, in which case they are not yet bound to a
    particular revision of the file.  In that case the text_sha1,
    text_size and text_id are absent.

    >>> i = Inventory()
    >>> i.path2id('')
    'TREE_ROOT'
    >>> i.add(InventoryEntry('123', 'src', 'directory', ROOT_ID))
    >>> i.add(InventoryEntry('2323', 'hello.c', 'file', parent_id='123'))
    >>> for j in i.iter_entries():
    ...     print j
    ...
    ('src', InventoryEntry('123', 'src', kind='directory', parent_id='TREE_ROOT'))
    ('src/hello.c', InventoryEntry('2323', 'hello.c', kind='file', parent_id='123'))
    >>> i.add(InventoryEntry('2323', 'bye.c', 'file', '123'))
    Traceback (most recent call last):
    ...
    BzrError: inventory already contains entry with id {2323}
    >>> i.add(InventoryEntry('2324', 'bye.c', 'file', '123'))
    >>> i.add(InventoryEntry('2325', 'wibble', 'directory', '123'))
    >>> i.path2id('src/wibble')
    '2325'
    >>> '2325' in i
    True
    >>> i.add(InventoryEntry('2326', 'wibble.c', 'file', '2325'))
    >>> i['2326']
    InventoryEntry('2326', 'wibble.c', kind='file', parent_id='2325')
    >>> for j in i.iter_entries():
    ...     print j[0]
    ...     assert i.path2id(j[0])
    ...
    src
    src/bye.c
    src/hello.c
    src/wibble
    src/wibble/wibble.c
    >>> i.id2path('2326')
    'src/wibble/wibble.c'

    TODO: Maybe also keep the full path of the entry, and the children?
           But those depend on its position within a particular inventory, and
           it would be nice not to need to hold the backpointer here.
    """

    # TODO: split InventoryEntry into subclasses for files,
    # directories, etc etc.

    # Class-level defaults: an entry that was never given a text still
    # answers None for these attributes.
    text_sha1 = None
    text_size = None

    def __init__(self, file_id, name, kind, parent_id, text_id=None):
        """Create an InventoryEntry

        The filename must be a single component, relative to the
        parent directory; it cannot be a whole path or relative name.

        >>> e = InventoryEntry('123', 'hello.c', 'file', ROOT_ID)
        >>> e.name
        'hello.c'
        >>> e.file_id
        '123'
        >>> e = InventoryEntry('123', 'src/hello.c', 'file', ROOT_ID)
        Traceback (most recent call last):
        BzrCheckError: InventoryEntry name 'src/hello.c' is invalid

        Raises BzrCheckError if name contains a slash or backslash, and
        BzrError if kind is neither 'directory' nor 'file'.
        """
        if '/' in name or '\\' in name:
            raise BzrCheckError('InventoryEntry name %r is invalid' % name)

        self.file_id = file_id
        self.name = name
        self.kind = kind
        self.text_id = text_id
        self.parent_id = parent_id
        if kind == 'directory':
            # Only directories carry a name -> entry mapping.
            self.children = {}
        elif kind == 'file':
            pass
        else:
            raise BzrError("unhandled entry kind %r" % kind)

    def sorted_children(self):
        """Return the (name, entry) pairs of this directory, sorted by name.

        Only entries that have a children dictionary (directories)
        support this; on a file entry the attribute lookup fails with
        AttributeError.
        """
        # Snapshot into a real list first so that sort() is available
        # whatever kind of object items() hands back.
        pairs = list(self.children.items())
        pairs.sort()
        return pairs

    def copy(self):
        """Return a new InventoryEntry with the same field values."""
        other = InventoryEntry(self.file_id, self.name, self.kind,
                               self.parent_id, text_id=self.text_id)
        other.text_sha1 = self.text_sha1
        other.text_size = self.text_size
        # note that children are *not* copied; they're pulled across when
        # others are added
        return other

    def __repr__(self):
        return ("%s(%r, %r, kind=%r, parent_id=%r)"
                % (self.__class__.__name__,
                   self.file_id,
                   self.name,
                   self.kind,
                   self.parent_id))

    def to_element(self):
        """Convert to XML element"""
        e = Element('entry')

        e.set('name', self.name)
        e.set('file_id', self.file_id)
        e.set('kind', self.kind)

        if self.text_size is not None:
            e.set('text_size', '%d' % self.text_size)

        # Optional text attributes are written only when they are set.
        for f in ['text_id', 'text_sha1']:
            v = getattr(self, f)
            if v is not None:
                e.set(f, v)

        # to be conservative, we don't externalize the root pointers
        # for now, leaving them as null in the xml form.  in a future
        # version it will be implied by nested elements.
        if self.parent_id != ROOT_ID:
            assert isinstance(self.parent_id, basestring)
            e.set('parent_id', self.parent_id)

        e.tail = '\n'

        return e

    def from_element(cls, elt):
        """Construct an entry from an XML 'entry' element.

        A missing parent_id attribute means the entry lives directly
        in the root directory.  Raises ValueError if a text_size
        attribute is present but is not an integer.
        """
        assert elt.tag == 'entry'

        ## original format inventories don't have a parent_id for
        ## nodes in the root directory, but it's cleaner to use one
        ## internally.
        parent_id = elt.get('parent_id')
        if parent_id is None:
            parent_id = ROOT_ID

        entry = cls(elt.get('file_id'), elt.get('name'), elt.get('kind'),
                    parent_id)
        entry.text_id = elt.get('text_id')
        entry.text_sha1 = elt.get('text_sha1')

        # Convert only when the attribute exists.  The old
        # "v and int(v)" form quietly stored '' for an empty attribute.
        v = elt.get('text_size')
        if v is None:
            entry.text_size = None
        else:
            entry.text_size = int(v)

        return entry

    from_element = classmethod(from_element)

    def __eq__(self, other):
        """Entries are equal when all of their stored fields are equal.

        Children are not compared.
        """
        if not isinstance(other, InventoryEntry):
            return NotImplemented

        return (self.file_id == other.file_id) \
               and (self.name == other.name) \
               and (self.text_sha1 == other.text_sha1) \
               and (self.text_size == other.text_size) \
               and (self.text_id == other.text_id) \
               and (self.parent_id == other.parent_id) \
               and (self.kind == other.kind)

    def __ne__(self, other):
        return not (self == other)

    def __hash__(self):
        # Entries are mutable and compare by value, so they must not be
        # used as dictionary keys or set members.
        raise ValueError('not hashable')

231

232

233

234

class RootEntry(InventoryEntry):
    """Entry for the root directory of an inventory.

    The root has an empty name, no parent, and the kind
    'root_directory'.  InventoryEntry.__init__ is not called here; it
    would reject that kind.
    """

    def __init__(self, file_id):
        """Create a root entry with the given file_id and no children."""
        self.file_id = file_id
        self.children = {}
        self.kind = 'root_directory'
        self.parent_id = None
        self.name = ''
        # Inherited methods (InventoryEntry.__eq__, copy) read text_id,
        # which is otherwise only assigned by InventoryEntry.__init__.
        # Without this they fail with AttributeError on a root entry.
        self.text_id = None

    def __eq__(self, other):
        """Root entries are equal when their ids and children are equal."""
        if not isinstance(other, RootEntry):
            return NotImplemented

        return (self.file_id == other.file_id) \
               and (self.children == other.children)

248

249

250

251

class Inventory(XMLMixin):
    """Inventory of versioned files in a tree.

    This describes which file_id is present at each point in the tree,
    and possibly the SHA-1 or other information about the file.
    Entries can be looked up either by path or by file_id.

    The inventory represents a typical unix file tree, with
    directories containing files and subdirectories.  We never store
    the full path to a file, because renaming a directory implicitly
    moves all of its contents.  This class internally maintains a
    lookup tree that allows the children under a directory to be
    returned quickly.

    InventoryEntry objects must not be modified after they are
    inserted, other than through the Inventory API.

    >>> inv = Inventory()
    >>> inv.write_xml(sys.stdout)
    <inventory>
    </inventory>
    >>> inv.add(InventoryEntry('123-123', 'hello.c', 'file', ROOT_ID))
    >>> inv['123-123'].name
    'hello.c'

    May be treated as an iterator or set to look up file ids:

    >>> bool(inv.path2id('hello.c'))
    True
    >>> '123-123' in inv
    True

    May also look up by name:

    >>> [x[0] for x in inv.iter_entries()]
    ['hello.c']

    >>> inv.write_xml(sys.stdout)
    <inventory>
    <entry file_id="123-123" kind="file" name="hello.c" />
    </inventory>

    """

    def __init__(self):
        """Create an empty inventory.

        The inventory is created with a default root directory, whose
        file id is ROOT_ID.
        """
        self.root = RootEntry(ROOT_ID)
        # Maps file_id -> entry for every entry, the root included.
        self._byid = {self.root.file_id: self.root}

    def __iter__(self):
        """Iterate over the file ids in the inventory (root included)."""
        return iter(self._byid)

    def __len__(self):
        """Returns number of entries."""
        return len(self._byid)

    def iter_entries(self, from_dir=None):
        """Return (path, entry) pairs, in order by name.

        from_dir may be a directory entry or the file id of one; when
        omitted, iteration starts at the root.  Paths are relative to
        from_dir, and from_dir itself is not yielded.
        """
        if from_dir is None:
            assert self.root
            from_dir = self.root
        elif isinstance(from_dir, basestring):
            from_dir = self._byid[from_dir]

        kids = list(from_dir.children.items())
        kids.sort()
        for name, ie in kids:
            yield name, ie
            if ie.kind == 'directory':
                # Hand the entry itself down; there is no need to look
                # it up again by id.
                for cn, cie in self.iter_entries(from_dir=ie):
                    yield os.path.join(name, cn), cie

    def entries(self):
        """Return list of (path, ie) for all entries except the root.

        This may be faster than iter_entries.
        """
        accum = []

        def descend(dir_ie, dir_path):
            kids = list(dir_ie.children.items())
            kids.sort()
            for name, ie in kids:
                child_path = os.path.join(dir_path, name)
                accum.append((child_path, ie))
                if ie.kind == 'directory':
                    descend(ie, child_path)

        descend(self.root, '')
        return accum

    def directories(self):
        """Return (path, entry) pairs for all directories, including the root.
        """
        accum = []

        def descend(parent_ie, parent_path):
            accum.append((parent_path, parent_ie))

            kids = [(ie.name, ie) for ie in parent_ie.children.values()
                    if ie.kind == 'directory']
            kids.sort()

            for name, child_ie in kids:
                child_path = os.path.join(parent_path, name)
                descend(child_ie, child_path)

        descend(self.root, '')
        return accum

    def __contains__(self, file_id):
        """True if this entry contains a file with given id.

        >>> inv = Inventory()
        >>> inv.add(InventoryEntry('123', 'foo.c', 'file', ROOT_ID))
        >>> '123' in inv
        True
        >>> '456' in inv
        False
        """
        return file_id in self._byid

    def __getitem__(self, file_id):
        """Return the entry for given file_id.

        >>> inv = Inventory()
        >>> inv.add(InventoryEntry('123123', 'hello.c', 'file', ROOT_ID))
        >>> inv['123123'].name
        'hello.c'

        Raises BzrError if the id is None or is not in the inventory.
        """
        try:
            return self._byid[file_id]
        except KeyError:
            if file_id is None:
                raise BzrError("can't look up file_id None")
            else:
                raise BzrError("file_id {%s} not in inventory" % file_id)

    def get_file_kind(self, file_id):
        """Return the kind of the entry with the given id.

        Unlike __getitem__, an unknown id raises KeyError here.
        """
        return self._byid[file_id].kind

    def get_child(self, parent_id, filename):
        """Return the entry called filename in directory parent_id, or None."""
        return self[parent_id].children.get(filename)

    def add(self, entry):
        """Add entry to inventory.

        To add a file to a branch ready to be committed, use Branch.add,
        which calls this.

        Raises BzrError if the file id is already present, if the
        parent id is unknown, or if the parent already has a child
        with the same name.
        """
        if entry.file_id in self._byid:
            raise BzrError("inventory already contains entry with id {%s}" % entry.file_id)

        try:
            parent = self._byid[entry.parent_id]
        except KeyError:
            raise BzrError("parent_id {%s} not in inventory" % entry.parent_id)

        if entry.name in parent.children:
            raise BzrError("%s is already versioned" %
                    appendpath(self.id2path(parent.file_id), entry.name))

        self._byid[entry.file_id] = entry
        parent.children[entry.name] = entry

    def add_path(self, relpath, kind, file_id=None):
        """Add entry from a path.

        The immediate parent must already be versioned; otherwise
        NotVersionedError is raised.  When file_id is omitted a new one
        is generated from relpath.
        """
        from bzrlib.errors import NotVersionedError

        parts = splitpath(relpath)
        if not parts:
            raise BzrError("cannot re-add root of inventory")

        if file_id is None:
            # Import explicitly rather than relying on some other
            # module having already loaded bzrlib.branch.
            from bzrlib.branch import gen_file_id
            file_id = gen_file_id(relpath)

        parent_path = parts[:-1]
        parent_id = self.path2id(parent_path)
        if parent_id is None:
            raise NotVersionedError(parent_path)

        ie = InventoryEntry(file_id, parts[-1],
                            kind=kind, parent_id=parent_id)
        return self.add(ie)

    def __delitem__(self, file_id):
        """Remove entry by id.

        >>> inv = Inventory()
        >>> inv.add(InventoryEntry('123', 'foo.c', 'file', ROOT_ID))
        >>> '123' in inv
        True
        >>> del inv['123']
        >>> '123' in inv
        False

        Deleting a directory also deletes everything below it.
        """
        ie = self[file_id]

        assert self[ie.parent_id].children[ie.name] == ie

        # TODO: Test deleting all children; maybe hoist to a separate
        # deltree method?
        if ie.kind == 'directory':
            # Each recursive delete removes the child from ie.children,
            # so walk a snapshot rather than the live dictionary.
            for cie in list(ie.children.values()):
                del self[cie.file_id]
            del ie.children

        del self._byid[file_id]
        del self[ie.parent_id].children[ie.name]

    def to_element(self):
        """Convert to XML Element"""
        e = Element('inventory')
        e.text = '\n'
        for path, ie in self.iter_entries():
            e.append(ie.to_element())
        return e

    def from_element(cls, elt):
        """Construct from XML Element

        >>> inv = Inventory()
        >>> inv.add(InventoryEntry('foo.c-123981239', 'foo.c', 'file', ROOT_ID))
        >>> elt = inv.to_element()
        >>> inv2 = Inventory.from_element(elt)
        >>> inv2 == inv
        True
        """
        assert elt.tag == 'inventory'
        o = cls()
        for e in elt:
            o.add(InventoryEntry.from_element(e))
        return o

    from_element = classmethod(from_element)

    def __eq__(self, other):
        """Compare two sets by comparing their contents.

        >>> i1 = Inventory()
        >>> i2 = Inventory()
        >>> i1 == i2
        True
        >>> i1.add(InventoryEntry('123', 'foo', 'file', ROOT_ID))
        >>> i1 == i2
        False
        >>> i2.add(InventoryEntry('123', 'foo', 'file', ROOT_ID))
        >>> i1 == i2
        True
        """
        if not isinstance(other, Inventory):
            return NotImplemented

        if len(self._byid) != len(other._byid):
            # shortcut: obviously not the same
            return False

        return self._byid == other._byid

    def __ne__(self, other):
        return not (self == other)

    def __hash__(self):
        # Inventories are mutable and compare by value.
        raise ValueError('not hashable')

    def get_idpath(self, file_id):
        """Return a list of file_ids for the path to an entry.

        The list contains one element for each directory followed by
        the id of the file itself.  So the length of the returned list
        is equal to the depth of the file in the tree, counting the
        root directory as depth 1.

        Raises BzrError if an id on the way up is not in the inventory.
        """
        p = []
        while file_id is not None:
            try:
                ie = self._byid[file_id]
            except KeyError:
                raise BzrError("file_id {%s} not found in inventory" % file_id)
            p.append(ie.file_id)
            file_id = ie.parent_id
        # Collected leaf-first; callers expect root-first.
        p.reverse()
        return p

    def id2path(self, file_id):
        """Return the path to file_id as a string.

        The names of the entries from below the root down to file_id
        are joined with os.sep; the root itself gives ''.
        """
        # get all names, skipping root
        p = [self[fid].name for fid in self.get_idpath(file_id)[1:]]
        return os.sep.join(p)

    def path2id(self, name):
        """Walk down through directories to return entry of last component.

        name may be either a list of path components, or a single
        string, in which case it is automatically split.

        This returns the file id of the last component in the path,
        which may be either a file or a directory.

        Returns None iff the path is not found.
        """
        if isinstance(name, types.StringTypes):
            name = splitpath(name)

        mutter("lookup path %r" % name)

        parent = self.root
        for f in name:
            try:
                cie = parent.children[f]
                assert cie.name == f
                assert cie.parent_id == parent.file_id
                parent = cie
            except KeyError:
                # or raise an error?
                return None

        return parent.file_id

    def has_filename(self, names):
        """True if the given path is present in the inventory."""
        # path2id reports "not found" as None, so test for exactly that.
        return self.path2id(names) is not None

    def has_id(self, file_id):
        """True if an entry with this file id is present."""
        return file_id in self._byid

    def rename(self, file_id, new_parent_id, new_name):
        """Move a file within the inventory.

        This can change either the name, or the parent, or both.

        This does not move the working file.

        Raises BzrError if new_name is not an acceptable filename, if
        the new parent already has a child of that name, or if the
        entry would be moved into itself or one of its own
        subdirectories.
        """
        if not is_valid_name(new_name):
            raise BzrError("not an acceptable filename: %r" % new_name)

        new_parent = self._byid[new_parent_id]
        if new_name in new_parent.children:
            raise BzrError("%r already exists in %r" % (new_name, self.id2path(new_parent_id)))

        new_parent_idpath = self.get_idpath(new_parent_id)
        if file_id in new_parent_idpath:
            raise BzrError("cannot move directory %r into a subdirectory of itself, %r"
                    % (self.id2path(file_id), self.id2path(new_parent_id)))

        file_ie = self._byid[file_id]
        old_parent = self._byid[file_ie.parent_id]

        # TODO: Don't leave things messed up if this fails

        del old_parent.children[file_ie.name]
        new_parent.children[new_name] = file_ie

        file_ie.name = new_name
        file_ie.parent_id = new_parent_id

633

634

635

636

637

# A valid entry name is non-empty and contains neither kind of slash.
_NAME_RE = re.compile(r'^[^/\\]+$')


def is_valid_name(name):
    """Return True if name is usable as a single path component.

    The name must be non-empty and must not contain '/' or '\\'.
    """
    return bool(_NAME_RE.match(name))

Older »