/brz/remove-bazaar : revision 2255.2.45

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/dirstate.py

Committer: Robert Collins
Date: 2007-02-14 09:32:11 UTC
mto: (2255.5.1 dirstate) (2321.1.1 integration)
mto: This revision was merged to the branch mainline in revision 2322.
Revision ID: robertc@robertcollins.net-20070214093211-hwsla8ly0tfycav4

Dirstate - fix revision_tree() behaviour to match the interface contract.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

HACKING

INSTALL

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/repofmt

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/HttpServer.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/transport/smart.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/README.1st

doc/bazaar-vcs.org.kid

doc/centralized_workflow.txt

doc/configuration.txt

doc/default.css

doc/http_smart_server.txt

doc/index.txt

doc/plugins.txt

doc/server.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

doc/version_info.txt

generate_docs.py

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

.testr.conf

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

filegraph.py

help.py

hg.py

info.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

tests/test_unpeel_map.py

tests/test_workingtree.py

transportgit.py

tree.py

unpeel_map.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/dirstate.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""DirState objects record the state of a directory and its bzr metadata.

Pseduo EBNF grammar for the disk format:

MINIKIND = "f" | "d" | "l";

NL = "\n";

NULL = "\0";

WHOLE NUMBER = {digit}, digit;

dirstate format = header line, full checksum, row count, parent details,

ghost_details, rows;

header line = "#bazaar dirstate flat format 1", NL;

full checksum = "adler32: ", ["-"], WHOLE NUMBER, NL;

row count = "num_entries: ", digit, NL;

parent_details = WHOLE NUMBER, NULL, NL; XXX: complete this line

ghost_details = WHOLE NUMBER, NULL, {GHOST_ID NULL}*, NL;

rows = dirname, NULL, basename, NULL, MINIKIND, NULL, fileid_utf8, NULL,

WHOLE NUMBER (* size *), NULL, packed stat, NULL, sha1|symlink target,

{PARENT ROW}

PARENT ROW = NULL, revision_utf8, NULL, MINIKIND, NULL, dirname, NULL,

basename, NULL, WHOLE NUMBER (* size *), NULL, "y" | "n", NULL,

SHA1

PARENT ROW's are emitted for every parent that is not in the ghosts details

line. That is, if the parents are foo, bar, baz, and the ghosts are bar, then

each row will have a PARENT ROW for foo and baz, but not for bar.

----

Design priorities:

1) Fast end to end use for bzr's top 5 uses cases.

2) fall back current object model as needed.

3) scale usably to the largest trees known today - say 50K entries.

Locking:

Eventually reuse dirstate objects across locks IFF the dirstate file has not

been modified, but will require that we flush/ignore cached stat-hit data

because we wont want to restat all files on disk just because a lock was

acquired, yet we cannot trust the data after the previous lock was released.

Memory representation:

vecter of all directories, and vector of the childen ?

i.e.

root_row = (direntry for root, [parent_direntries_for_root]),

dirblocks = [

('', ['data for achild', 'data for bchild', 'data for cchild'])

('dir', ['achild', 'cchild', 'echild'])

]

- single bisect to find N subtrees from a path spec

- in-order for serialisation - this is 'dirblock' grouping.

- insertion of a file '/a' affects only the '/' child-vector, that is, to

insert 10K elements from scratch does not generates O(N^2) memoves of a

single vector, rather each individual, which tends to be limited to a

manageable number. Will scale badly on trees with 10K entries in a

single directory. compare with Inventory.InventoryDirectory which has

a dictionary for the children. No bisect capability, can only probe for

exact matches, or grab all elements and sorta.

- Whats the risk of error here? Once we have the base format being processed

we should have a net win regardless of optimality. So we are going to

go with what seems reasonably.

open questions:

maybe we should do a test profile of these core structure - 10K simulated searches/lookups/etc?

Objects for each row?

The lifetime of Dirstate objects is current per lock, but see above for

possible extensions. The lifetime of a row from a dirstate is expected to be

very short in the optimistic case: which we are optimising for. For instance,

subtree status will determine from analysis of the disk data what rows need to

be examined at all, and will be able to determine from a single row whether

that file has altered or not, so we are aiming to process tens of thousands of

entries each second within the dirstate context, before exposing anything to

the larger codebase. This suggests we want the time for a single file

comparison to be < 0.1 milliseconds. That would give us 10000 paths per second

processed, and to scale to 100 thousand we'll another order of magnitude to do

that. Now, as the lifetime for all unchanged entries is the time to parse, stat

the file on disk, and then immediately discard, the overhead of object creation

becomes a significant cost.

Figures: Creating a tuple from from 3 elements was profiled at 0.0625

microseconds, whereas creating a object which is subclassed from tuple was

0.500 microseconds, and creating an object with 3 elements and slots was 3

microseconds long. 0.1 milliseconds is 100 microseconds, and ideally we'll get

100

down to 10 microseconds for the total processing - having 33% of that be object

101

creation is a huge overhead. There is a potential cost in using tuples within

102

each row which is that the conditional code to do comparisons may be slower

103

than method invocation, but method invocation is known to be slow due to stack

104

frame creation, so avoiding methods in these tight inner loops in unfortunately

105

desirable. We can consider a pyrex version of this with objects in future if

106

desired.

107

108

"""

109

110

111

import base64

112

import bisect

113

import cStringIO

114

import os

115

import sha

116

import struct

117

import zlib

118

119

from bzrlib import (

120

errors,

121

trace,

122

)

123

import bzrlib.inventory

124

from bzrlib.osutils import pathjoin, sha_file, sha_string, walkdirs

125

126

127

class DirState(object):

128

"""Record directory and metadata state for fast access.

129

130

A dirstate is a specialised data structure for managing local working

131

tree state information. Its not yet well defined whether it is platform

132

specific, and if it is how we detect/parameterise that.

133

"""

134

135

_kind_to_minikind = {'file':'f', 'directory':'d', 'symlink':'l'}

136

_minikind_to_kind = {'f':'file', 'd':'directory', 'l':'symlink'}

137

_to_yesno = {True:'y', False: 'n'} # TODO profile the performance gain

138

# of using int conversion rather than a dict here. AND BLAME ANDREW IF

139

# it is faster.

140

141

NOT_IN_MEMORY = 0

142

IN_MEMORY_UNMODIFIED = 1

143

IN_MEMORY_MODIFIED = 2

144

145

NULLSTAT = 'x' * 32

146

147

def __init__(self):

148

"""Create a DirState object.

149

150

Attributes of note:

151

152

:attr _root_row: The root row of the directory/file information,

153

- contains the path to / - '', ''

154

- kind of 'directory',

155

- the file id of the root in utf8

156

- size of 0

157

- a packed state

158

- and no sha information.

159

"""

160

# _header_state and _dirblock_state represent the current state

161

# of the dirstate metadata and the per-row data respectiely.

162

# NOT_IN_MEMORY indicates that no data is in memory

163

# IN_MEMORY_UNMODIFIED indicates that what we have in memory

164

# is the same as is on disk

165

# IN_MEMORY_MODIFIED indicates that we have a modified version

166

# of what is on disk.

167

# In future we will add more granularity, for instance _dirblock_state

168

# will probably support partially-in-memory as a separate variable,

169

# allowing for partially-in-memory unmodified and partially-in-memory

170

# modified states.

171

self._header_state = DirState.NOT_IN_MEMORY

172

self._dirblock_state = DirState.NOT_IN_MEMORY

173

self._dirblocks = []

174

self._ghosts = []

175

self._parents = []

176

self._root_row = None

177

self._state_file=None

178

179

def add(self, path, file_id, kind, stat, link_or_sha1):

180

"""Add a path to be tracked.

181

182

:param path: The path within the dirstate - '' is the root, 'foo' is the

183

path foo within the root, 'foo/bar' is the path bar within foo

184

within the root.

185

:param file_id: The file id of the path being added.

186

:param kind: The kind of the path.

187

:param stat: The output of os.lstate for the path.

188

:param link_or_sha1: The sha value of the file, or the target of a

189

symlink. '' for directories.

190

"""

191

# adding a file:

192

# find the block its in.

193

# find the location in the block.

194

# check its not there

195

# add it.

196

self._read_dirblocks_if_needed()

197

utf8path = path.encode('utf8')

198

dirname, basename = os.path.split(utf8path)

199

block_index = self._find_dirblock_index(dirname)

200

if block_index < 0:

201

# some parent path has not been added - its an error to add this

202

# child

203

raise errors.NotVersionedError(path, str(self))

204

block = self._dirblocks[block_index][1]

205

if stat is None:

206

size = 0

207

packed_stat = DirState.NULLSTAT

208

else:

209

size = stat.st_size

210

packed_stat = pack_stat(stat)

211

if kind == 'file':

212

row_data = ((dirname, basename, kind, file_id.encode('utf8'),

213

size, packed_stat, link_or_sha1), [])

214

elif kind == 'directory':

215

row_data = ((dirname, basename, kind, file_id.encode('utf8'),

216

0, packed_stat, ''), [])

217

elif kind == 'symlink':

218

row_data = ((dirname, basename, kind, file_id.encode('utf8'),

219

size, packed_stat, link_or_sha1), [])

220

else:

221

raise errors.BzrError('unknown kind %r' % kind)

222

row_index = bisect.bisect_left(block, row_data)

223

if len(block) > row_index:

224

assert block[row_index][0][1] != basename, \

225

"basename %r already added" % basename

226

block.insert(row_index, row_data)

227

228

if kind == 'directory':

229

# insert a new dirblock

230

bisect.insort_left(self._dirblocks, (utf8path, []))

231

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

232

233

def add_deleted(self, fileid_utf8, parents):

234

"""Add fileid_utf8 with parents as deleted."""

235

self._read_dirblocks_if_needed()

236

new_row = self._make_deleted_row(fileid_utf8, parents)

237

block_index = self._find_dirblock_index(new_row[0][0])

238

if block_index < 0:

239

# no deleted block yet.

240

bisect.insort_left(self._dirblocks, (new_row[0][0], []))

241

block_index = self._find_dirblock_index(new_row[0][0])

242

block = self._dirblocks[block_index][1]

243

row_index = bisect.insort_left(block, new_row)

244

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

245

246

def _find_dirblock_index(self, dirname):

247

"""Find the dirblock index for dirname.

248

249

:return: -1 if the dirname is not present, or the index in

250

self._dirblocks for it otherwise.

251

"""

252

block_index = bisect.bisect_left(self._dirblocks, (dirname, []))

253

if (block_index == len(self._dirblocks) or

254

self._dirblocks[block_index][0] != dirname):

255

return -1

256

return block_index

257

258

@staticmethod

259

def from_tree(tree, dir_state_filename):

260

"""Create a dirstate from a bzr Tree.

261

262

:param tree: The tree which should provide parent information and

263

inventory ids.

264

"""

265

# XXX: aka the big ugly.

266

result = DirState()

267

result._state_file = open(dir_state_filename, 'wb+')

268

269

_encode = base64.encodestring

270

271

parent_ids = tree.get_parent_ids()

272

num_parents = len(parent_ids)

273

if num_parents > 3:

274

raise ValueError('Cannot handle more than 3 parents')

275

276

parent_trees = []

277

for parent_id in parent_ids:

278

parent_trees.append(tree.branch.repository.revision_tree(parent_id))

279

280

# FIXME: is this utf8 safe?

281

282

to_minikind = DirState._kind_to_minikind

283

to_yesno = DirState._to_yesno

284

285

st = os.lstat(tree.basedir)

286

root_info = (

287

'', '' # No path

288

, 'directory', tree.inventory.root.file_id.encode('utf8')

289

, 0 # no point having a size for dirs.

290

, pack_stat(st)

291

, '' # No sha

292

)

293

root_parents = []

294

for parent_tree in parent_trees:

295

root_parents.append((

296

parent_tree.inventory.root.revision.encode('utf8'),

297

'directory', '',

298

'',

299

'',

300

False,

301

'',

302

))

303

304

root_row = (root_info, root_parents)

305

dirblocks = []

306

for dirinfo, block in tree.walkdirs():

307

# dirinfo is path, id

308

to_remove = []

309

# add the row for this block

310

block_row = []

311

dirblocks.append((dirinfo[0], block_row))

312

for relpath, name, kind, st, fileid, versionedkind in block:

313

if fileid is None:

314

# unversioned file, skip

315

continue

316

# TODO? factor out this loop body as a helper function ?

317

s = None

318

dirname, basename = os.path.split(relpath.encode('utf8'))

319

if kind == 'file':

320

s = tree.get_file_sha1(fileid, relpath)

321

elif kind == 'directory':

322

if name in ('.bzr', '.hg', 'CVS', '.svn', '_svn'):

323

raise Exception('skipping dirs not supported yet')

324

# Skip this, and all children

325

to_remove.append((relpath, name, kind, st, abspath))

326

continue

327

# no sha value

328

s = ''

329

elif kind == 'symlink':

330

# sha value of the link target ?!

331

s = os.readlink(abspath)

332

parent_info = []

333

for count in xrange(num_parents):

334

parent_info.append(

335

result._parent_info(parent_trees[count], fileid))

336

row_data = (dirname.encode('utf8'), basename.encode('utf8'),

337

kind, fileid.encode('utf8'), st.st_size, pack_stat(st),

338

339

block_row.append((row_data, parent_info))

340

341

# It isn't safe to remove entries while we are iterating

342

# over the same list, so remove them now

343

for entry in to_remove:

344

block.remove(entry)

345

346

#lines.append(result._get_parents_line(parent_ids))

347

#lines.append(result._get_ghosts_line([]))

348

result._set_data(parent_ids, root_row, dirblocks)

349

result.save()

350

return result

351

352

def get_ghosts(self):

353

"""Return a list of the parent tree revision ids that are ghosts."""

354

self._read_header_if_needed()

355

return self._ghosts

356

357

def get_lines(self):

358

"""Serialise the entire dirstate to a sequence of lines."""

359

if (self._header_state == DirState.IN_MEMORY_UNMODIFIED and

360

self._dirblock_state == DirState.IN_MEMORY_UNMODIFIED):

361

# read whats on disk.

362

self._state_file.seek(0)

363

return self._state_file.readlines()

364

lines = []

365

lines.append(self._get_parents_line(self.get_parent_ids()))

366

lines.append(self._get_ghosts_line(self._ghosts))

367

# append the root line which is special cased

368

lines.extend(map(self._row_to_line, self._iter_rows()))

369

return self._get_output_lines(lines)

370

371

def _get_ghosts_line(self, ghost_ids):

372

"""Create a line for the state file for ghost information."""

373

return '\0'.join([str(len(ghost_ids))] + ghost_ids)

374

375

def _get_parents_line(self, parent_ids):

376

"""Create a line for the state file for parents information."""

377

return '\0'.join([str(len(parent_ids))] + parent_ids)

378

379

def get_parent_ids(self):

380

"""Return a list of the parent tree ids for the directory state."""

381

self._read_header_if_needed()

382

return list(self._parents)

383

384

@staticmethod

385

def initialize(path):

386

"""Create a new dirstate on path.

387

388

The new dirstate will be an empty tree - that is it has no parents,

389

and only a root node - which has id ROOT_ID.

390

391

:param path: The name of the file for the dirstate.

392

:return: A DirState object.

393

"""

394

# This constructs a new DirState object on a path, sets the _state_file

395

# to a new empty file for that path. It then calls _set_data() with our

396

# stock empty dirstate information - a root with ROOT_ID, no children,

397

# and no parents. Finally it calls save() to ensure that this data will

398

# persist.

399

result = DirState()

400

result._state_file = open(path, 'wb+')

401

# a new root directory, with a pack_stat (the x's) that is just noise and will

402

# never match the output of base64 encode.

403

root_row_data = ('', '', 'directory', bzrlib.inventory.ROOT_ID, 0,

404

DirState.NULLSTAT, '')

405

root_parents = []

406

root_row = (root_row_data, root_parents)

407

empty_tree_dirblocks = [('', [])] # root dir contents - no entries.

408

result._set_data([], root_row, empty_tree_dirblocks)

409

try:

410

result.save()

411

except:

412

result._state_file.close()

413

raise

414

return result

415

416

def _iter_rows(self):

417

"""Iterate over all the row data in the dirstate.

418

419

Each yelt item is a tuple of (row_data, parent_data_list).

420

"""

421

self._read_dirblocks_if_needed()

422

yield self._root_row

423

for directory in self._dirblocks:

424

for row in directory[1]:

425

yield row

426

427

def _get_output_lines(self, lines):

428

"""format lines for final output.

429

430

:param lines: A sequece of lines containing the parents list and the

431

path lines.

432

"""

433

output_lines = ['#bazaar dirstate flat format 1\n']

434

lines.append('') # a final newline

435

inventory_text = '\0\n\0'.join(lines)

436

output_lines.append('adler32: %s\n' % (zlib.adler32(inventory_text),))

437

# -3, 1 for num parents, 1 for ghosts, 1 for final newline

438

num_entries = len(lines)-3

439

output_lines.append('num_entries: %s\n' % (num_entries,))

440

output_lines.append(inventory_text)

441

return output_lines

442

443

def _make_deleted_row(self, fileid_utf8, parents):

444

"""Return a deleted for for fileid_utf8."""

445

return ('/', 'RECYCLED.BIN', 'file', fileid_utf8, 0, DirState.NULLSTAT,

446

''), parents

447

448

@staticmethod

449

def on_file(path):

450

"""Construct a DirState on the file at path path."""

451

result = DirState()

452

result._state_file = open(path, 'rb+')

453

return result

454

455

def _parent_info(self, parent_tree, fileid):

456

"""Generate the parent information for file_id in parent_tree."""

457

# FIXME: This is probably expensive - we encode the path that in the

458

# common case will be the same across all parents, twice.

459

# also, id2path is slow in inventory, and we should make that fast.

460

try:

461

parent_entry = parent_tree.inventory[fileid]

462

except errors.NoSuchId:

463

# this parent does not have fileid - return a bogus entry, which

464

# will be filtered out on iteration etc.

465

# an empty revision id is bogus and safe to put on disk

466

# we make it be a 'file', just because. We give it the

467

# deleted file path dirname and basename, 0 size, not executable

468

# and no sha1.

469

return ('', 'file', '/', 'RECYCLED.BIN', 0, False, '')

470

parent_path = parent_tree.inventory.id2path(fileid)

471

dirname, basename = os.path.split(parent_path.encode('utf8'))

472

return (parent_entry.revision.encode('utf8'),

473

parent_entry.kind,

474

# FIXME: set these from the parent

475

dirname.encode('utf8'), basename.encode('utf8'),

476

parent_entry.text_size or 0,

477

parent_entry.executable,

478

parent_entry.text_sha1 or '',

479

)

480

481

def _read_dirblocks_if_needed(self):

482

"""Read in all the dirblocks from the file if they are not in memory."""

483

self._read_header_if_needed()

484

if self._dirblock_state == DirState.NOT_IN_MEMORY:

485

# the _state_file pointer will be positioned at the start of the

486

# dirblocks.

487

text = self._state_file.read()

488

# TODO: check the adler checksums. adler_measured = zlib.adler32(text)

489

490

fields = text.split('\0')

491

# Remove the last blank entry

492

trailing = fields.pop()

493

assert trailing == ''

494

# consider turning fields into a tuple.

495

496

# skip the first field which is the trailing null from the header.

497

cur = 1

498

# Each line now has an extra '\n' field which is not used

499

# so we just skip over it

500

# number of fields per dir_entry

501

# + number of fields per parent_entry

502

# + newline

503

num_present_parents = len(self._parents) - len(self._ghosts)

504

entry_size = 7 + (7 * (num_present_parents)) + 1

505

expected_field_count = entry_size * self._num_entries

506

if len(fields) - cur > expected_field_count:

507

fields = fields[:expected_field_count + cur]

508

trace.mutter('Unexpectedly long dirstate field count!')

509

print "XXX: incorrectly truncated dirstate file bug triggered."

510

field_count = len(fields)

511

# this checks our adjustment, and also catches file too short.

512

assert field_count - cur == expected_field_count, \

513

'field count incorrect %s != %s, entry_size=%s, '\

514

'num_entries=%s fields=%r' % (

515

field_count - cur, expected_field_count, entry_size,

516

self._num_entries, fields)

517

518

# Fast path the case where there are 1 or 2 parents

519

if num_present_parents == 0:

520

entries = [(fields[pos:pos+7], []) for pos in xrange(cur, field_count, entry_size)]

521

elif num_present_parents == 1:

522

entries = [(fields[pos:pos+7], [fields[pos+7:pos+14],])

523

for pos in xrange(cur, field_count, entry_size)]

524

elif num_present_parents == 2:

525

entries = [(fields[pos:pos+7], [

526

fields[pos+7:pos+14],

527

fields[pos+14:pos+21],])

528

for pos in xrange(cur, field_count, entry_size)]

529

else:

530

entries = [(

531

fields[pos:pos+7],

532

tuple([fields[chunk:chunk+7] for

533

chunk in xrange(pos + 7, pos+entry_size-1, 7)]))

534

for pos in xrange(cur, field_count, entry_size)

535

]

536

537

assert len(entries) == self._num_entries, '%s != %s entries' % (len(entries),

538

self._num_entries)

539

540

def _line_to_row(line):

541

"""Convert a freshly read line's size and minikind for use."""

542

# convert the minikind to kind

543

line[0][2] = self._minikind_to_kind[line[0][2]]

544

# convert the size to an int

545

line[0][4] = int(line[0][4])

546

for parent in line[1]:

547

parent[1] = self._minikind_to_kind[parent[1]]

548

parent[4] = int(parent[4])

549

parent[5] = parent[5] == 'y'

550

return tuple(line[0]), map(tuple, line[1])

551

new_rows = map(_line_to_row, entries)

552

self._rows_to_current_state(new_rows)

553

self._dirblock_state = DirState.IN_MEMORY_UNMODIFIED

554

555

def _read_header(self):

556

"""This reads in the metadata header, and the parent ids.

557

558

After reading in, the file should be positioned at the null

559

just before the start of the first record in the file.

560

561

:return: (expected adler checksum, number of entries, parent list)

562

"""

563

self._read_prelude()

564

parent_line = self._state_file.readline()

565

info = parent_line.split('\0')

566

num_parents = int(info[0])

567

assert num_parents == len(info)-2, 'incorrect parent info line'

568

self._parents = [p.decode('utf8') for p in info[1:-1]]

569

570

ghost_line = self._state_file.readline()

571

info = ghost_line.split('\0')

572

num_ghosts = int(info[1])

573

assert num_ghosts == len(info)-3, 'incorrect ghost info line'

574

self._ghosts = [p.decode('utf8') for p in info[2:-1]]

575

self._header_state = DirState.IN_MEMORY_UNMODIFIED

576

577

def _read_header_if_needed(self):

578

"""Read the header of the dirstate file if needed."""

579

if self._header_state == DirState.NOT_IN_MEMORY:

580

self._read_header()

581

582

def _read_prelude(self):

583

"""Read in the prelude header of the dirstate file

584

585

This only reads in the stuff that is not connected to the adler

586

checksum. The position will be correct to read in the rest of

587

the file and check the checksum after this point.

588

The next entry in the file should be the number of parents,

589

and their ids. Followed by a newline.

590

"""

591

header = self._state_file.readline()

592

assert header == '#bazaar dirstate flat format 1\n', \

593

'invalid header line: %r' % (header,)

594

adler_line = self._state_file.readline()

595

assert adler_line.startswith('adler32: '), 'missing adler32 checksum'

596

self.adler_expected = int(adler_line[len('adler32: '):-1])

597

num_entries_line = self._state_file.readline()

598

assert num_entries_line.startswith('num_entries: '), 'missing num_entries line'

599

self._num_entries = int(num_entries_line[len('num_entries: '):-1])

600

601

def _row_to_line(self, row):

602

"""Serialize row to a NULL delimited line ready for _get_output_lines.

603

604

:param row: A row_tuple as defined in the module docstring.

605

"""

606

entire_row = list(row[0])

607

for parent_number, parent_data in enumerate(row[1]):

608

# (revision, kind, dirname, basename, size, executable_bool, sha1)

609

entire_row.extend(parent_data)

610

# minikind conversion of the parent

611

parent_offset = 7 + parent_number * 7

612

entire_row[parent_offset + 1] = DirState._kind_to_minikind[parent_data[1]]

613

entire_row[parent_offset + 4] = str(parent_data[4])

614

entire_row[parent_offset + 5] = DirState._to_yesno[parent_data[5]]

615

# conversion from memory to disk-ready format:

616

# minikind conversion of the current row type.

617

entire_row[2] = DirState._kind_to_minikind[entire_row[2]]

618

entire_row[4] = str(entire_row[4])

619

# minikind of parents

620

return '\0'.join(entire_row)

621

622

def _rows_to_current_state(self, new_rows):

623

"""Load new_rows into self._root_row and self.dirblocks.

624

625

Process new_rows into the current state object, making them the active

626

state.

627

628

:param new_rows: A sorted list of rows. This function does not sort

629

to prevent unneeded overhead when callers have a sorted list

630

already.

631

:return: Nothing.

632

"""

633

assert new_rows[0][0][0:2] == ('', ''), \

634

"Incorrect root row %r" % new_rows[0][0]

635

self._root_row = new_rows[0]

636

self._dirblocks = [('', [])]

637

for row in new_rows[1:]:

638

if row[0] != self._dirblocks[-1][0]:

639

# new block

640

self._dirblocks.append((row[0][0], []))

641

# append the row to the current block

642

self._dirblocks[-1][1].append(row)

643

644

def save(self):

645

"""Save any pending changes created during this session.

646

647

We reuse the existing file, because that prevents race conditions with

648

file creation, and we expect to be using oslocks on it in the near

649

future to prevent concurrent modification and reads - because dirstates

650

incremental data aggretation is not compatible with reading a modified

651

file, and replacing a file in use by another process is impossible on

652

windows.

653

654

A dirstate in read only mode should be smart enough though to validate

655

that the file has not changed, and otherwise discard its cache and

656

start over, to allow for fine grained read lock duration, so 'status'

657

wont block 'commit' - for example.

658

"""

659

if (self._header_state == DirState.IN_MEMORY_MODIFIED or

660

self._dirblock_state == DirState.IN_MEMORY_MODIFIED):

661

self._state_file.seek(0)

662

self._state_file.writelines(self.get_lines())

663

self._state_file.truncate()

664

self._state_file.flush()

665

self._header_state = DirState.IN_MEMORY_UNMODIFIED

666

self._dirblock_state = DirState.IN_MEMORY_UNMODIFIED

667

668

def _set_data(self, parent_ids, root_row, dirblocks):

669

"""Set the full dirstate data in memory.

670

671

This is an internal function used to completely replace the objects

672

in memory state. It puts the dirstate into state 'full-dirty'.

673

674

:param parent_ids: A list of parent tree revision ids.

675

:param root_row: The root row - a tuple of the root direntry and the

676

list of matching direntries from the parent_ids trees.

677

:param dirblocks: A list containing one tuple for each directory in the

678

tree. Each tuple contains the directory path and a list of

679

row data in the same format as root_row.

680

"""

681

# our memory copy is now authoritative.

682

self._dirblocks = dirblocks

683

self._root_row = root_row

684

self._header_state = DirState.IN_MEMORY_MODIFIED

685

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

686

self._parents = list(parent_ids)

687

688

def set_path_id(self, path, new_id):

689

"""Change the id of path to new_id.

690

691

:param path: The path inside the tree to set - '' is the root, 'foo'

692

is the path foo in the root.

693

:param new_id: The new id to assign to the path. If unicode, it will

694

be encoded to utf8. In future this will be deprecated: avoid using

695

unicode ids if possible.

696

"""

697

# TODO: start warning here.

698

if new_id.__class__ == unicode:

699

new_id = new_id.encode('utf8')

700

self._read_dirblocks_if_needed()

701

if new_id == self._root_row[0][3]:

702

# the root id is unchanged

703

return

704

if len(path) or len(self._parents):

705

import pdb;pdb.set_trace()

706

# logic not written

707

raise NotImplementedError(self.set_path_id)

708

root_info, root_parents = self._root_row

709

self._root_row = (root_info[0:3] + (new_id, ) + root_info[4:7]), root_parents

710

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

711

712

def set_parent_trees(self, trees, ghosts):

713

"""Set the parent trees for the dirstate.

714

715

:param trees: A list of revision_id, tree tuples. tree must be provided

716

even if the revision_id refers to a ghost: supply an empty tree in

717

this case.

718

:param ghosts: A list of the revision_ids that are ghosts at the time

719

of setting.

720

"""

721

# TODO: generate a list of parent indexes to preserve to save

722

# processing specific parent trees. In the common case one tree will

723

# be preserved - the left most parent.

724

# TODO: if the parent tree is a dirstate, we might want to walk them

725

# all by path in parallel for 'optimal' common-case performance.

726

# generate new root row.

727

self._read_dirblocks_if_needed()

728

old_root = self._root_row

729

root_info = self._root_row[0]

730

new_parent_count = len(trees)

731

# sketch: loop over all rows in the dirstate, cherry picking

732

# entries from the parent trees, if they are not ghosts.

733

# after we finish walking the dirstate, all entries not in the dirstate

734

# are deletes, so we want to append them to the end as per the design

735

# discussions. So do a set difference on ids with the parents to

736

# get deletes, and add them to the end.

737

new_rows = []

738

# skip ghost trees, as they dont get represented.

739

parent_trees = [tree for rev_id, tree in trees if rev_id not in ghosts]

740

parent_tree_count = len(parent_trees)

741

# loop over existing entries in the dirstate.

742

checked_ids = set()

743

for entry, old_parents in self._iter_rows():

744

file_id = entry[3]

745

checked_ids.add(file_id)

746

new_parents = [None] * parent_tree_count

747

for position, parent_tree in enumerate(parent_trees):

748

# revision_utf8, KIND, dirname, basename, size, executable, sha

749

new_parents[position] = self._parent_info(parent_tree, file_id)

750

assert None not in new_parents

751

new_rows.append((entry, new_parents))

752

# get additional ids that are present in parents and not in this tree.

753

deleted_ids = set()

754

for tree in parent_trees:

755

deleted_ids.update(set(tree.inventory._byid).difference(checked_ids))

756

# add the deleted ids to the dirstate. deleted files are represented as

757

# a file with dirname '', basename ''

758

for file_id in deleted_ids:

759

# add these ids to the deleted block

760

checked_ids.add(file_id)

761

# deleted items have a synthetic entry.

762

entry = ('/', 'RECYCLED.BIN', 'file', file_id.encode('utf8'), 0,

763

DirState.NULLSTAT, '')

764

new_parents = [None] * parent_tree_count

765

for position, parent_tree in enumerate(parent_trees):

766

# revision_utf8, KIND, dirname, basename, size, executable, sha

767

new_parents[position] = self._parent_info(parent_tree, file_id)

768

assert None not in new_parents

769

new_rows.append((entry, new_parents))

770

771

# sort all the rows

772

new_rows = sorted(new_rows)

773

self._rows_to_current_state(new_rows)

774

self._parents = [rev_id for rev_id, tree in trees]

775

self._ghosts = list(ghosts)

776

self._header_state = DirState.IN_MEMORY_MODIFIED

777

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

778

779

def set_state_from_inventory(self, new_inv):

780

"""Set new_inv as the current state.

781

782

:param new_inv: The inventory object to set current state from.

783

"""

784

self._read_dirblocks_if_needed()

785

# sketch:

786

# generate a byid index of the dirstate

787

parent_rows = {}

788

for row, parents in self._iter_rows():

789

parent_rows[row[3]] = parents

790

# walk the new inventory in directory order, copying parent data

791

# from the id index

792

new_rows = []

793

for path, entry in new_inv.iter_entries_by_dir():

794

dirname, basename = os.path.split(path.encode('utf8'))

795

kind = entry.kind

796

fileid_utf8 = entry.file_id.encode('utf8')

797

if kind == 'file':

798

size = entry.text_size or 0

799

sha1 = entry.text_sha1 or ''

800

elif kind == 'symlink':

801

size = 0

802

sha1 = (entry.symlink_target or '').encode('utf8')

803

else:

804

size = 0

805

sha1 = ''

806

try:

807

parents = parent_rows[fileid_utf8]

808

del parent_rows[fileid_utf8]

809

except KeyError:

810

parents = []

811

new_row = (dirname, basename, kind, fileid_utf8, size, DirState.NULLSTAT, sha1), parents

812

new_rows.append(new_row)

813

# append deleted data to the end of the tree as usual.

814

for fileid_utf8, parents in parent_rows.items():

815

if not parents:

816

# this row was only present in the old state, had no parents

817

continue

818

# deleted items have a synthetic entry.

819

new_row = ('/', 'RECYCLED.BIN', 'file', fileid_utf8, 0,

820

DirState.NULLSTAT, ''), parents

821

new_rows.append(new_row)

822

823

# sort all the rows (the ones in parents not in current may be unsorted)

824

new_rows = sorted(new_rows)

825

self._rows_to_current_state(new_rows)

826

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

827

828

829

def pack_stat(st, _encode=base64.encodestring, _pack=struct.pack):

830

"""Convert stat values into a packed representation."""

831

# jam 20060614 it isn't really worth removing more entries if we

832

# are going to leave it in packed form.

833

# With only st_mtime and st_mode filesize is 5.5M and read time is 275ms

834

# With all entries filesize is 5.9M and read time is mabye 280ms

835

# well within the noise margin

836

837

# base64.encode always adds a final newline, so strip it off

838

return _encode(_pack('>llllll'

839

, st.st_size, st.st_mtime, st.st_ctime

840

, st.st_dev, st.st_ino, st.st_mode))[:-1]

841

Older »