/brz/remove-bazaar : revision 2255.2.20

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/dirstate.py

Committer: Robert Collins
Date: 2007-02-13 06:15:20 UTC
mto: (2255.5.1 dirstate) (2321.1.1 integration)
mto: This revision was merged to the branch mainline in revision 2322.
Revision ID: robertc@robertcollins.net-20070213061520-3ga0hywdijgr8fxg

Bypass irrelevant basis_inventory tests for dirstate.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

HACKING

INSTALL

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/repofmt

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/HttpServer.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/transport/smart.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/README.1st

doc/bazaar-vcs.org.kid

doc/centralized_workflow.txt

doc/configuration.txt

doc/default.css

doc/http_smart_server.txt

doc/index.txt

doc/plugins.txt

doc/server.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

doc/version_info.txt

generate_docs.py

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/dirstate.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""DirState objects record the state of a directory and its bzr metadata.

Pseduo EBNF grammar for the disk format:

MINIKIND = "f" | "d" | "l";

NL = "\n";

NULL = "\0";

WHOLE NUMBER = {digit}, digit;

dirstate format = header line, full checksum, row count, parent details,

ghost_details, rows;

header line = "#bazaar dirstate flat format 1", NL;

full checksum = "adler32: ", ["-"], WHOLE NUMBER, NL;

row count = "num_entries: ", digit, NL;

parent_details = WHOLE NUMBER, NULL, NL; XXX: complete this line

ghost_details = WHOLE NUMBER, NULL, {GHOST_ID NULL}*, NL;

rows = dirname, NULL, basename, NULL, MINIKIND, NULL, fileid_utf8, NULL,

WHOLE NUMBER (* size *), NULL, packed stat, NULL, sha1|symlink target,

{PARENT ROW}

PARENT ROW = NULL, revision_utf8, NULL, MINIKIND, NULL, dirname, NULL,

basename, NULL, WHOLE NUMBER (* size *), NULL, "y" | "n", NULL,

SHA1

PARENT ROW's are emitted for every parent that is not in the ghosts details

line. That is, if the parents are foo, bar, baz, and the ghosts are bar, then

each row will have a PARENT ROW for foo and baz, but not for bar.

----

Design priorities:

1) Fast end to end use for bzr's top 5 uses cases.

2) fall back current object model as needed.

3) scale usably to the largest trees known today - say 50K entries.

Locking:

Eventually reuse dirstate objects across locks IFF the dirstate file has not

been modified, but will require that we flush/ignore cached stat-hit data

because we wont want to restat all files on disk just because a lock was

acquired, yet we cannot trust the data after the previous lock was released.

Memory representation:

vecter of all directories, and vector of the childen ?

i.e.

root_row = (direntry for root, [parent_direntries_for_root]),

dirblocks = [

('', ['data for achild', 'data for bchild', 'data for cchild'])

('dir', ['achild', 'cchild', 'echild'])

]

- single bisect to find N subtrees from a path spec

- in-order for serialisation - this is 'dirblock' grouping.

- insertion of a file '/a' affects only the '/' child-vector, that is, to

insert 10K elements from scratch does not generates O(N^2) memoves of a

single vector, rather each individual, which tends to be limited to a

manageable number. Will scale badly on trees with 10K entries in a

single directory. compare with Inventory.InventoryDirectory which has

a dictionary for the children. No bisect capability, can only probe for

exact matches, or grab all elements and sorta.

- Whats the risk of error here? Once we have the base format being processed

we should have a net win regardless of optimality. So we are going to

go with what seems reasonably.

open questions:

maybe we should do a test profile of these core structure - 10K simulated searches/lookups/etc?

Objects for each row?

The lifetime of Dirstate objects is current per lock, but see above for

possible extensions. The lifetime of a row from a dirstate is expected to be

very short in the optimistic case: which we are optimising for. For instance,

subtree status will determine from analysis of the disk data what rows need to

be examined at all, and will be able to determine from a single row whether

that file has altered or not, so we are aiming to process tens of thousands of

entries each second within the dirstate context, before exposing anything to

the larger codebase. This suggests we want the time for a single file

comparison to be < 0.1 milliseconds. That would give us 10000 paths per second

processed, and to scale to 100 thousand we'll another order of magnitude to do

that. Now, as the lifetime for all unchanged entries is the time to parse, stat

the file on disk, and then immediately discard, the overhead of object creation

becomes a significant cost.

Figures: Creating a tuple from from 3 elements was profiled at 0.0625

microseconds, whereas creating a object which is subclassed from tuple was

0.500 microseconds, and creating an object with 3 elements and slots was 3

microseconds long. 0.1 milliseconds is 100 microseconds, and ideally we'll get

100

down to 10 microseconds for the total processing - having 33% of that be object

101

creation is a huge overhead. There is a potential cost in using tuples within

102

each row which is that the conditional code to do comparisons may be slower

103

than method invocation, but method invocation is known to be slow due to stack

104

frame creation, so avoiding methods in these tight inner loops in unfortunately

105

desirable. We can consider a pyrex version of this with objects in future if

106

desired.

107

108

"""

109

110

111

import base64

112

import bisect

113

import cStringIO

114

import os

115

import sha

116

import struct

117

import zlib

118

119

from bzrlib import errors

120

import bzrlib.inventory

121

from bzrlib.osutils import pathjoin, sha_file, sha_string, walkdirs

122

123

124

class DirState(object):

125

"""Record directory and metadata state for fast access.

126

127

A dirstate is a specialised data structure for managing local working

128

tree state information. Its not yet well defined whether it is platform

129

specific, and if it is how we detect/parameterise that.

130

"""

131

132

_kind_to_minikind = {'file':'f', 'directory':'d', 'symlink':'l'}

133

_minikind_to_kind = {'f':'file', 'd':'directory', 'l':'symlink'}

134

_to_yesno = {True:'y', False: 'n'} # TODO profile the performance gain

135

# of using int conversion rather than a dict here. AND BLAME ANDREW IF

136

# it is faster.

137

138

NOT_IN_MEMORY = 0

139

IN_MEMORY_UNMODIFIED = 1

140

IN_MEMORY_MODIFIED = 2

141

142

NULLSTAT = 'x' * 32

143

144

def __init__(self):

145

"""Create a DirState object.

146

147

Attributes of note:

148

149

:attr _root_row: The root row of the directory/file information,

150

- contains the path to / - '', ''

151

- kind of 'directory',

152

- the file id of the root in utf8

153

- size of 0

154

- a packed state

155

- and no sha information.

156

"""

157

# _header_state and _dirblock_state represent the current state

158

# of the dirstate metadata and the per-row data respectiely.

159

# NOT_IN_MEMORY indicates that no data is in memory

160

# IN_MEMORY_UNMODIFIED indicates that what we have in memory

161

# is the same as is on disk

162

# IN_MEMORY_MODIFIED indicates that we have a modified version

163

# of what is on disk.

164

# In future we will add more granularity, for instance _dirblock_state

165

# will probably support partially-in-memory as a separate variable,

166

# allowing for partially-in-memory unmodified and partially-in-memory

167

# modified states.

168

self._header_state = DirState.NOT_IN_MEMORY

169

self._dirblock_state = DirState.NOT_IN_MEMORY

170

self._dirblocks = []

171

self._ghosts = []

172

self._parents = []

173

self._root_row = None

174

self._state_file=None

175

176

def add(self, path, file_id, kind, stat, link_or_sha1):

177

"""Add a path to be tracked.

178

179

:param path: The path within the dirstate - '' is the root, 'foo' is the

180

path foo within the root, 'foo/bar' is the path bar within foo

181

within the root.

182

:param file_id: The file id of the path being added.

183

:param kind: The kind of the path.

184

:param stat: The output of os.lstate for the path.

185

:param link_or_sha1: The sha value of the file, or the target of a

186

symlink. '' for directories.

187

"""

188

# adding a file:

189

# find the block its in.

190

# find the location in the block.

191

# check its not there

192

# add it.

193

self._read_dirblocks_if_needed()

194

utf8path = path.encode('utf8')

195

dirname, basename = os.path.split(utf8path)

196

block_index = bisect.bisect_left(self._dirblocks, (dirname, []))

197

if (block_index == len(self._dirblocks) or

198

self._dirblocks[block_index][0] != dirname):

199

# some parent path has not been added - its an error to add this

200

# child

201

raise errors.NoSuchFile(path)

202

block = self._dirblocks[block_index][1]

203

if kind == 'file':

204

row_data = ((dirname, basename, kind, file_id.encode('utf8'),

205

stat.st_size, pack_stat(stat), link_or_sha1), [])

206

elif kind == 'directory':

207

row_data = ((dirname, basename, kind, file_id.encode('utf8'),

208

0, pack_stat(stat), ''), [])

209

elif kind == 'symlink':

210

row_data = ((dirname, basename, kind, file_id.encode('utf8'),

211

stat.st_size, pack_stat(stat), link_or_sha1), [])

212

else:

213

raise errors.BzrError('unknown kind %r' % kind)

214

row_index = bisect.bisect_left(block, row_data)

215

if len(block) > row_index:

216

assert block[row_index][1] != basename, \

217

"basename %r already added" % basename

218

block.insert(row_index, row_data)

219

220

if kind == 'directory':

221

# insert a new dirblock

222

bisect.insort_left(self._dirblocks, (utf8path, []))

223

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

224

225

def add_parent_tree(self, tree_id, tree):

226

"""Add tree as a parent to this dirstate."""

227

self._read_dirblocks_if_needed()

228

self._parents.append(tree_id)

229

self._header_state = DirState.IN_MEMORY_MODIFIED

230

if tree is None:

231

self._ghosts.append(tree_id)

232

233

@staticmethod

234

def from_tree(tree, dir_state_filename):

235

"""Create a dirstate from a bzr Tree.

236

237

:param tree: The tree which should provide parent information and

238

inventory ids.

239

"""

240

# XXX: aka the big ugly.

241

result = DirState()

242

result._state_file = open(dir_state_filename, 'wb+')

243

244

_encode = base64.encodestring

245

246

parent_ids = tree.get_parent_ids()

247

num_parents = len(parent_ids)

248

if num_parents > 3:

249

raise ValueError('Cannot handle more than 3 parents')

250

251

parent_trees = []

252

for parent_id in parent_ids:

253

parent_trees.append(tree.branch.repository.revision_tree(parent_id))

254

255

# FIXME: is this utf8 safe?

256

257

to_minikind = DirState._kind_to_minikind

258

to_yesno = DirState._to_yesno

259

260

st = os.lstat(tree.basedir)

261

root_info = (

262

'', '' # No path

263

, 'directory', tree.inventory.root.file_id.encode('utf8')

264

, 0 # no point having a size for dirs.

265

, pack_stat(st)

266

, '' # No sha

267

)

268

root_parents = []

269

for parent_tree in parent_trees:

270

root_parents.append((

271

parent_tree.inventory.root.revision.encode('utf8'),

272

'directory', '',

273

'',

274

'',

275

False,

276

'',

277

))

278

279

root_row = (root_info, root_parents)

280

dirblocks = []

281

for dirinfo, block in tree.walkdirs():

282

# dirinfo is path, id

283

to_remove = []

284

# add the row for this block

285

block_row = []

286

dirblocks.append((dirinfo[0], block_row))

287

for relpath, name, kind, st, fileid, versionedkind in block:

288

if fileid is None:

289

# unversioned file, skip

290

continue

291

# TODO? factor out this loop body as a helper function ?

292

s = None

293

dirname, basename = os.path.split(relpath.encode('utf8'))

294

if kind == 'file':

295

s = tree.get_file_sha1(fileid, relpath)

296

elif kind == 'directory':

297

if name in ('.bzr', '.hg', 'CVS', '.svn', '_svn'):

298

raise Exception('skipping dirs not supported yet')

299

# Skip this, and all children

300

to_remove.append((relpath, name, kind, st, abspath))

301

continue

302

# no sha value

303

s = ''

304

elif kind == 'symlink':

305

# sha value of the link target ?!

306

s = os.readlink(abspath)

307

parent_info = []

308

for count in xrange(num_parents):

309

parent_info.append(

310

result._parent_info(parent_trees[count], fileid))

311

row_data = (dirname.encode('utf8'), basename.encode('utf8'),

312

kind, fileid.encode('utf8'), st.st_size, pack_stat(st),

313

314

block_row.append((row_data, parent_info))

315

316

# It isn't safe to remove entries while we are iterating

317

# over the same list, so remove them now

318

for entry in to_remove:

319

block.remove(entry)

320

321

#lines.append(result._get_parents_line(parent_ids))

322

#lines.append(result._get_ghosts_line([]))

323

result._set_data(parent_ids, root_row, dirblocks)

324

result.save()

325

return result

326

327

def get_ghosts(self):

328

"""Return a list of the parent tree revision ids that are ghosts."""

329

self._read_header_if_needed()

330

return self._ghosts

331

332

def get_lines(self):

333

"""Serialise the entire dirstate to a sequence of lines."""

334

if (self._header_state == DirState.IN_MEMORY_UNMODIFIED and

335

self._dirblock_state == DirState.IN_MEMORY_UNMODIFIED):

336

# read whats on disk.

337

self._state_file.seek(0)

338

return self._state_file.readlines()

339

lines = []

340

lines.append(self._get_parents_line(self.get_parent_ids()))

341

lines.append(self._get_ghosts_line(self._ghosts))

342

# append the root line which is special cased

343

lines.extend(map(self._row_to_line, self._iter_rows()))

344

return self._get_output_lines(lines)

345

346

def _get_ghosts_line(self, ghost_ids):

347

"""Create a line for the state file for ghost information."""

348

return '\0'.join([str(len(ghost_ids))] + ghost_ids)

349

350

def _get_parents_line(self, parent_ids):

351

"""Create a line for the state file for parents information."""

352

return '\0'.join([str(len(parent_ids))] + parent_ids)

353

354

def get_parent_ids(self):

355

"""Return a list of the parent tree ids for the directory state."""

356

self._read_header_if_needed()

357

return self._parents

358

359

@staticmethod

360

def initialize(path):

361

"""Create a new dirstate on path.

362

363

The new dirstate will be an empty tree - that is it has no parents,

364

and only a root node - which has id ROOT_ID.

365

366

:param path: The name of the file for the dirstate.

367

:return: A DirState object.

368

"""

369

# This constructs a new DirState object on a path, sets the _state_file

370

# to a new empty file for that path. It then calls _set_data() with our

371

# stock empty dirstate information - a root with ROOT_ID, no children,

372

# and no parents. Finally it calls save() to ensure that this data will

373

# persist.

374

result = DirState()

375

result._state_file = open(path, 'wb+')

376

# a new root directory, with a pack_stat (the x's) that is just noise and will

377

# never match the output of base64 encode.

378

root_row_data = ('', '', 'directory', bzrlib.inventory.ROOT_ID, 0,

379

DirState.NULLSTAT, '')

380

root_parents = []

381

root_row = (root_row_data, root_parents)

382

empty_tree_dirblocks = [('', [])] # root dir contents - no entries.

383

result._set_data([], root_row, empty_tree_dirblocks)

384

try:

385

result.save()

386

except:

387

result._state_file.close()

388

raise

389

return result

390

391

def _iter_rows(self):

392

"""Iterate over all the row data in the dirstate.

393

394

Each yelt item is a tuple of (row_data, parent_data_list).

395

"""

396

self._read_dirblocks_if_needed()

397

yield self._root_row

398

for directory in self._dirblocks:

399

for row in directory[1]:

400

yield row

401

402

def _get_output_lines(self, lines):

403

"""format lines for final output.

404

405

:param lines: A sequece of lines containing the parents list and the

406

path lines.

407

"""

408

output_lines = ['#bazaar dirstate flat format 1\n']

409

lines.append('') # a final newline

410

inventory_text = '\0\n\0'.join(lines)

411

output_lines.append('adler32: %s\n' % (zlib.adler32(inventory_text),))

412

# -3, 1 for num parents, 1 for ghosts, 1 for final newline

413

num_entries = len(lines)-3

414

output_lines.append('num_entries: %s\n' % (num_entries,))

415

output_lines.append(inventory_text)

416

return output_lines

417

418

@staticmethod

419

def on_file(path):

420

"""Construct a DirState on the file at path path."""

421

result = DirState()

422

result._state_file = open(path, 'rb+')

423

return result

424

425

def _parent_info(self, parent_tree, fileid):

426

"""Generate the parent information for file_id in parent_tree."""

427

# FIXME: This is probably expensive - we encode the path that in the

428

# common case will be the same across all parents, twice.

429

# also, id2path is slow in inventory, and we should make that fast.

430

try:

431

parent_entry = parent_tree.inventory[fileid]

432

except errors.NoSuchId:

433

# this parent does not have fileid - return a bogus entry, which

434

# will be filtered out on iteration etc.

435

# an empty revision id is bogus and safe to put on disk

436

# we make it be a 'file', just because. We give it the

437

# deleted file path dirname and basename, 0 size, not executable

438

# and no sha1.

439

return ('', 'file', '/', 'RECYCLED.BIN', 0, False, '')

440

parent_path = parent_tree.inventory.id2path(fileid)

441

dirname, basename = os.path.split(parent_path.encode('utf8'))

442

return (parent_entry.revision.encode('utf8'),

443

parent_entry.kind,

444

# FIXME: set these from the parent

445

dirname.encode('utf8'), basename.encode('utf8'),

446

parent_entry.text_size or 0,

447

parent_entry.executable,

448

parent_entry.text_sha1 or '',

449

)

450

451

def _read_dirblocks_if_needed(self):

452

"""Read in all the dirblocks from the file if they are not in memory."""

453

self._read_header_if_needed()

454

if self._dirblock_state == DirState.NOT_IN_MEMORY:

455

# the _state_file pointer will be positioned at the start of the

456

# dirblocks.

457

text = self._state_file.read()

458

# TODO: check the adler checksums. adler_measured = zlib.adler32(text)

459

460

fields = text.split('\0')

461

# Remove the last blank entry

462

trailing = fields.pop()

463

assert trailing == ''

464

# consider turning fields into a tuple.

465

466

# skip the first field which is the trailing null from the header.

467

cur = 1

468

field_count = len(fields)

469

# Each line now has an extra '\n' field which is not used

470

# so we just skip over it

471

# number of fields per dir_entry + number of fields per parent_entry + newline

472

num_parents = len(self._parents)

473

entry_size = 7 + (7 * (num_parents - len(self._ghosts))) + 1

474

expected_field_count = entry_size * self._num_entries

475

# is the file too short ?

476

assert field_count - cur == expected_field_count, \

477

'field count incorrect %s != %s, entry_size=%s, '\

478

'num_entries=%s fields=%r' % (

479

field_count - cur, expected_field_count, entry_size,

480

self._num_entries, fields)

481

482

# Fast path the case where there are 1 or 2 parents

483

if num_parents == 0:

484

entries = [(fields[pos:pos+7], []) for pos in xrange(cur, field_count, entry_size)]

485

elif num_parents == 1:

486

entries = [(fields[pos:pos+7], [fields[pos+7:pos+14],])

487

for pos in xrange(cur, field_count, entry_size)]

488

elif num_parents == 2:

489

entries = [(fields[pos:pos+7], [

490

fields[pos+7:pos+14],

491

fields[pos+14:pos+21],])

492

for pos in xrange(cur, field_count, entry_size)]

493

else:

494

entries = [(

495

fields[pos:pos+7],

496

tuple([fields[chunk:chunk+7] for

497

chunk in xrange(pos + 7, pos+entry_size-1, 7)]))

498

for pos in xrange(cur, field_count, entry_size)

499

]

500

501

assert len(entries) == self._num_entries, '%s != %s entries' % (len(entries),

502

self._num_entries)

503

504

def _line_to_row(line):

505

"""Convert a freshly read line's size and minikind for use."""

506

# convert the minikind to kind

507

line[0][2] = self._minikind_to_kind[line[0][2]]

508

# convert the size to an int

509

line[0][4] = int(line[0][4])

510

for parent in line[1]:

511

parent[1] = self._minikind_to_kind[parent[1]]

512

parent[4] = int(parent[4])

513

parent[5] = parent[5] == 'y'

514

return tuple(line[0]), map(tuple, line[1])

515

new_rows = map(_line_to_row, entries)

516

self._rows_to_current_state(new_rows)

517

self._dirblock_state = DirState.IN_MEMORY_UNMODIFIED

518

519

def _read_header(self):

520

"""This reads in the metadata header, and the parent ids.

521

522

After reading in, the file should be positioned at the null

523

just before the start of the first record in the file.

524

525

:return: (expected adler checksum, number of entries, parent list)

526

"""

527

self._read_prelude()

528

parent_line = self._state_file.readline()

529

info = parent_line.split('\0')

530

num_parents = int(info[0])

531

assert num_parents == len(info)-2, 'incorrect parent info line'

532

self._parents = [p.decode('utf8') for p in info[1:-1]]

533

534

ghost_line = self._state_file.readline()

535

info = ghost_line.split('\0')

536

num_ghosts = int(info[1])

537

assert num_ghosts == len(info)-3, 'incorrect ghost info line'

538

self._ghosts = [p.decode('utf8') for p in info[2:-1]]

539

self._header_state = DirState.IN_MEMORY_UNMODIFIED

540

541

def _read_header_if_needed(self):

542

"""Read the header of the dirstate file if needed."""

543

if self._header_state == DirState.NOT_IN_MEMORY:

544

self._read_header()

545

546

def _read_prelude(self):

547

"""Read in the prelude header of the dirstate file

548

549

This only reads in the stuff that is not connected to the adler

550

checksum. The position will be correct to read in the rest of

551

the file and check the checksum after this point.

552

The next entry in the file should be the number of parents,

553

and their ids. Followed by a newline.

554

"""

555

header = self._state_file.readline()

556

assert header == '#bazaar dirstate flat format 1\n', \

557

'invalid header line: %r' % (header,)

558

adler_line = self._state_file.readline()

559

assert adler_line.startswith('adler32: '), 'missing adler32 checksum'

560

self.adler_expected = int(adler_line[len('adler32: '):-1])

561

num_entries_line = self._state_file.readline()

562

assert num_entries_line.startswith('num_entries: '), 'missing num_entries line'

563

self._num_entries = int(num_entries_line[len('num_entries: '):-1])

564

565

def _row_to_line(self, row):

566

"""Serialize row to a NULL delimited line ready for _get_output_lines.

567

568

:param row: A row_tuple as defined in the module docstring.

569

"""

570

entire_row = list(row[0])

571

for parent_number, parent_data in enumerate(row[1]):

572

# (revision, kind, dirname, basename, size, executable_bool, sha1)

573

entire_row.extend(parent_data)

574

# minikind conversion of the parent

575

parent_offset = 7 + parent_number * 7

576

entire_row[parent_offset + 1] = DirState._kind_to_minikind[parent_data[1]]

577

entire_row[parent_offset + 4] = str(parent_data[4])

578

entire_row[parent_offset + 5] = DirState._to_yesno[parent_data[5]]

579

# conversion from memory to disk-ready format:

580

# minikind conversion of the current row type.

581

entire_row[2] = DirState._kind_to_minikind[entire_row[2]]

582

entire_row[4] = str(entire_row[4])

583

# minikind of parents

584

return '\0'.join(entire_row)

585

586

def _rows_to_current_state(self, new_rows):

587

"""Load new_rows into self._root_row and self.dirblocks.

588

589

Process new_rows into the current state object, making them the active

590

state.

591

592

:param new_rows: A sorted list of rows. This function does not sort

593

to prevent unneeded overhead when callers have a sorted list

594

already.

595

:return: Nothing.

596

"""

597

assert new_rows[0][0][0:2] == ('', ''), \

598

"Incorrect root row %r" % new_rows[0][0]

599

self._root_row = new_rows[0]

600

self._dirblocks = [('', [])]

601

for row in new_rows[1:]:

602

if row[0] != self._dirblocks[-1][0]:

603

# new block

604

self._dirblocks.append((row[0][0], []))

605

# append the row to the current block

606

self._dirblocks[-1][1].append(row)

607

608

def save(self):

609

"""Save any pending changes created during this session."""

610

if (self._header_state == DirState.IN_MEMORY_MODIFIED or

611

self._dirblock_state == DirState.IN_MEMORY_MODIFIED):

612

self._state_file.seek(0)

613

self._state_file.writelines(self.get_lines())

614

self._state_file.flush()

615

self._state_file.truncate()

616

self._header_state = DirState.IN_MEMORY_UNMODIFIED

617

self._dirblock_state = DirState.IN_MEMORY_UNMODIFIED

618

619

def _set_data(self, parent_ids, root_row, dirblocks):

620

"""Set the full dirstate data in memory.

621

622

This is an internal function used to completely replace the objects

623

in memory state. It puts the dirstate into state 'full-dirty'.

624

625

:param parent_ids: A list of parent tree revision ids.

626

:param root_row: The root row - a tuple of the root direntry and the

627

list of matching direntries from the parent_ids trees.

628

:param dirblocks: A list containing one tuple for each directory in the

629

tree. Each tuple contains the directory path and a list of

630

row data in the same format as root_row.

631

"""

632

# our memory copy is now authoritative.

633

self._dirblocks = dirblocks

634

self._root_row = root_row

635

self._header_state = DirState.IN_MEMORY_MODIFIED

636

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

637

self._parents = list(parent_ids)

638

639

def set_path_id(self, path, new_id):

640

"""Change the id of path to new_id.

641

642

:param path: The path inside the tree to set - '' is the root, 'foo'

643

is the path foo in the root.

644

:param new_id: The new id to assign to the path. If unicode, it will

645

be encoded to utf8. In future this will be deprecated: avoid using

646

unicode ids if possible.

647

"""

648

self._read_header_if_needed()

649

if len(path) or len(self._parents):

650

# logic not written

651

raise NotImplementedError(self.set_path_id)

652

self._read_dirblocks_if_needed()

653

if new_id.__class__ == unicode:

654

new_id = new_id.encode('utf8')

655

root_info, root_parents = self._root_row

656

self._root_row = (root_info[0:3] + (new_id, ) + root_info[4:7]), root_parents

657

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

658

659

def set_parent_trees(self, trees, ghosts):

660

"""Set the parent trees for the dirstate.

661

662

:param trees: A list of revision_id, tree tuples. tree must be provided

663

even if the revision_id refers to a ghost: supply an empty tree in

664

this case.

665

:param ghosts: A list of the revision_ids that are ghosts at the time

666

of setting.

667

"""

668

# TODO: generate a list of parent indexes to preserve to save

669

# processing specific parent trees. In the common case one tree will

670

# be preserved - the left most parent.

671

# TODO: if the parent tree is a dirstate, we might want to walk them

672

# all by path in parallel for 'optimal' common-case performance.

673

# generate new root row.

674

self._read_dirblocks_if_needed()

675

old_root = self._root_row

676

root_info = self._root_row[0]

677

new_parent_count = len(trees)

678

# sketch: loop over all rows in the dirstate, cherry picking

679

# entries from the parent trees, if they are not ghosts.

680

# after we finish walking the dirstate, all entries not in the dirstate

681

# are deletes, so we want to append them to the end as per the design

682

# discussions. So do a set difference on ids with the parents to

683

# get deletes, and add them to the end.

684

new_rows = []

685

# skip ghost trees, as they dont get represented.

686

parent_trees = [tree for rev_id, tree in trees if rev_id not in ghosts]

687

parent_tree_count = len(parent_trees)

688

# loop over existing entries in the dirstate.

689

checked_ids = set()

690

for entry, old_parents in self._iter_rows():

691

file_id = entry[3]

692

checked_ids.add(file_id)

693

new_parents = [None] * parent_tree_count

694

for position, parent_tree in enumerate(parent_trees):

695

# revision_utf8, KIND, dirname, basename, size, executable, sha

696

new_parents[position] = self._parent_info(parent_tree, file_id)

697

assert None not in new_parents

698

new_rows.append((entry, new_parents))

699

# get additional ids that are present in parents and not in this tree.

700

deleted_ids = set()

701

for tree in parent_trees:

702

deleted_ids.update(set(tree.inventory._byid).difference(checked_ids))

703

# add the deleted ids to the dirstate. deleted files are represented as

704

# a file with dirname '', basename ''

705

for file_id in deleted_ids:

706

# add these ids to the deleted block

707

checked_ids.add(file_id)

708

# deleted items have a synthetic entry.

709

entry = ('/', 'RECYCLED.BIN', 'file', file_id.encode('utf8'), 0,

710

DirState.NULLSTAT, '')

711

new_parents = [None] * parent_tree_count

712

for position, parent_tree in enumerate(parent_trees):

713

# revision_utf8, KIND, dirname, basename, size, executable, sha

714

new_parents[position] = self._parent_info(parent_tree, file_id)

715

assert None not in new_parents

716

new_rows.append((entry, new_parents))

717

718

# sort all the rows

719

new_rows = sorted(new_rows)

720

self._rows_to_current_state(new_rows)

721

self._parents = [rev_id for rev_id, tree in trees]

722

self._ghosts = list(ghosts)

723

self._header_state = DirState.IN_MEMORY_MODIFIED

724

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

725

726

def set_state_from_inventory(self, new_inv):

727

"""Set new_inv as the current state.

728

729

:param new_inv: The inventory object to set current state from.

730

"""

731

self._read_dirblocks_if_needed()

732

# sketch:

733

# generate a byid index of the dirstate

734

parent_rows = {}

735

for row, parents in self._iter_rows():

736

parent_rows[row[3]] = parents

737

# walk the new inventory in directory order, copying parent data

738

# from the id index

739

new_rows = []

740

for path, entry in new_inv.iter_entries_by_dir():

741

dirname, basename = os.path.split(path.encode('utf8'))

742

kind = entry.kind

743

fileid_utf8 = entry.file_id.encode('utf8')

744

if kind == 'file':

745

size = entry.text_size or 0

746

sha1 = entry.text_sha1 or ''

747

elif kind == 'symlink':

748

size = 0

749

sha1 = (entry.symlink_target or '').encode('utf8')

750

else:

751

size = 0

752

sha1 = ''

753

try:

754

parents = parent_rows[fileid_utf8]

755

del parent_rows[fileid_utf8]

756

except KeyError:

757

parents = []

758

new_row = (dirname, basename, kind, fileid_utf8, size, DirState.NULLSTAT, sha1), parents

759

new_rows.append(new_row)

760

# append deleted data to the end of the tree as usual.

761

for fileid_utf8, parents in parent_rows.items():

762

if not parents:

763

# this row was only present in the old state, had no parents

764

continue

765

# deleted items have a synthetic entry.

766

new_row = ('/', 'RECYCLED.BIN', 'file', fileid_utf8, 0,

767

DirState.NULLSTAT, ''), parents

768

new_rows.append(new_row)

769

770

# sort all the rows (the ones in parents not in current may be unsorted)

771

new_rows = sorted(new_rows)

772

self._rows_to_current_state(new_rows)

773

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

774

775

776

def pack_stat(st, _encode=base64.encodestring, _pack=struct.pack):

777

"""Convert stat values into a packed representation."""

778

# jam 20060614 it isn't really worth removing more entries if we

779

# are going to leave it in packed form.

780

# With only st_mtime and st_mode filesize is 5.5M and read time is 275ms

781

# With all entries filesize is 5.9M and read time is mabye 280ms

782

# well within the noise margin

783

784

# base64.encode always adds a final newline, so strip it off

785

return _encode(_pack('>llllll'

786

, st.st_size, st.st_mtime, st.st_ctime

787

, st.st_dev, st.st_ino, st.st_mode))[:-1]

788

Older »