/brz/remove-bazaar : revision 2255.2.83

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/dirstate.py

Committer: John Arbash Meinel
Date: 2007-02-17 03:34:50 UTC
mfrom: (2294 +trunk)
mto: (2255.5.1 dirstate) (2321.1.1 integration)
mto: This revision was merged to the branch mainline in revision 2322.
Revision ID: john@arbash-meinel.com-20070217033450-q6dtvrwl24ckzg5o

[merge] bzr.dev 2294

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

HACKING

INSTALL

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/HttpServer.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/transport/smart.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/README.1st

doc/bazaar-vcs.org.kid

doc/centralized_workflow.txt

doc/configuration.txt

doc/default.css

doc/http_smart_server.txt

doc/index.txt

doc/plugins.txt

doc/server.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

doc/version_info.txt

generate_docs.py

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

dir.py

dulwich

dulwich/.bzrignore

dulwich/COPYING

dulwich/Makefile

dulwich/README

dulwich/bin

dulwich/bin/dul-daemon

dulwich/bin/dul-receive-pack

dulwich/bin/dul-upload-pack

dulwich/bin/dulwich

dulwich/docs

dulwich/docs/protocol.txt

dulwich/dulwich

dulwich/dulwich/__init__.py

dulwich/dulwich/client.py

dulwich/dulwich/commit.py

dulwich/dulwich/errors.py

dulwich/dulwich/objects.py

dulwich/dulwich/pack.py

dulwich/dulwich/protocol.py

dulwich/dulwich/repo.py

dulwich/dulwich/server.py

dulwich/dulwich/tests

dulwich/dulwich/tests/__init__.py

dulwich/dulwich/tests/data

dulwich/dulwich/tests/data/blobs

dulwich/dulwich/tests/data/blobs/6f670c0fb53f9463760b7295fbb814e965fb20c8

dulwich/dulwich/tests/data/blobs/954a536f7819d40e6f637f849ee187dd10066349

dulwich/dulwich/tests/data/blobs/e69de29bb2d1d6434b8b29ae775ad8c2e48c5391

dulwich/dulwich/tests/data/commits

dulwich/dulwich/tests/data/commits/0d89f20333fbb1d2f3a94da77f4981373d8f4310

dulwich/dulwich/tests/data/commits/5dac377bdded4c9aeb8dff595f0faeebcc8498cc

dulwich/dulwich/tests/data/commits/60dacdc733de308bb77bb76ce0fb0f9b44c9769e

dulwich/dulwich/tests/data/packs

dulwich/dulwich/tests/data/packs/pack-bc63ddad95e7321ee734ea11a7a62d314e0d7481.idx

dulwich/dulwich/tests/data/packs/pack-bc63ddad95e7321ee734ea11a7a62d314e0d7481.pack

dulwich/dulwich/tests/data/repos

dulwich/dulwich/tests/data/repos/a

dulwich/dulwich/tests/data/repos/a/.git

dulwich/dulwich/tests/data/repos/a/.git/HEAD

dulwich/dulwich/tests/data/repos/a/.git/index

dulwich/dulwich/tests/data/repos/a/.git/objects

dulwich/dulwich/tests/data/repos/a/.git/objects/2a

dulwich/dulwich/tests/data/repos/a/.git/objects/2a/72d929692c41d8554c07f6301757ba18a65d91

dulwich/dulwich/tests/data/repos/a/.git/objects/4e

dulwich/dulwich/tests/data/repos/a/.git/objects/4e/f30bbfe26431a69c3820d3a683df54d688f2ec

dulwich/dulwich/tests/data/repos/a/.git/objects/4f

dulwich/dulwich/tests/data/repos/a/.git/objects/4f/2e6529203aa6d44b5af6e3292c837ceda003f9

dulwich/dulwich/tests/data/repos/a/.git/objects/7d

dulwich/dulwich/tests/data/repos/a/.git/objects/7d/9a07d797595ef11344549b8d08198e48c15364

dulwich/dulwich/tests/data/repos/a/.git/objects/a2

dulwich/dulwich/tests/data/repos/a/.git/objects/a2/96d0bb611188cabb256919f36bc30117cca005

dulwich/dulwich/tests/data/repos/a/.git/objects/a9

dulwich/dulwich/tests/data/repos/a/.git/objects/a9/0fa2d900a17e99b433217e988c4eb4a2e9a097

dulwich/dulwich/tests/data/repos/a/.git/objects/ff

dulwich/dulwich/tests/data/repos/a/.git/objects/ff/d47d45845a8f6576491e1edb97e3fe6a850e7f

dulwich/dulwich/tests/data/repos/a/.git/objects/info

dulwich/dulwich/tests/data/repos/a/.git/objects/pack

dulwich/dulwich/tests/data/repos/a/.git/refs

dulwich/dulwich/tests/data/repos/a/.git/refs/heads

dulwich/dulwich/tests/data/repos/a/.git/refs/heads/master

dulwich/dulwich/tests/data/repos/a/.git/refs/tags

dulwich/dulwich/tests/data/repos/a/a

dulwich/dulwich/tests/data/repos/a/b

dulwich/dulwich/tests/data/repos/a/c

dulwich/dulwich/tests/data/repos/ooo_merge

dulwich/dulwich/tests/data/repos/ooo_merge/.git

dulwich/dulwich/tests/data/repos/ooo_merge/.git/HEAD

dulwich/dulwich/tests/data/repos/ooo_merge/.git/index

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/29

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/29/69be3e8ee1c0222396a5611407e4769f14e54b

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/38

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/38/74e9c60a6d149c44c928140f250d81e6381520

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/6f

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/6f/670c0fb53f9463760b7295fbb814e965fb20c8

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/70

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/70/c190eb48fa8bbb50ddc692a17b44cb781af7f6

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/76

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/76/01d7f6231db6a57f7bbb79ee52e4d462fd44d1

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/90

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/90/182552c4a85a45ec2a835cadc3451bebdfe870

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/95

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/95/4a536f7819d40e6f637f849ee187dd10066349

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/b2

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/b2/a2766a2879c209ab1176e7e778b81ae422eeaa

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f5

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f5/07291b64138b875c28e03469025b1ea20bc614

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f9

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f9/e39b120c68182a4ba35349f832d0e4e61f485c

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/fb

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/fb/5b0425c7ce46959bec94d54b9a157645e114f5

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/info

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/pack

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs/heads

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs/heads/master

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs/tags

dulwich/dulwich/tests/data/repos/ooo_merge/a

dulwich/dulwich/tests/data/repos/ooo_merge/b

dulwich/dulwich/tests/data/repos/ooo_merge/c

dulwich/dulwich/tests/data/repos/simple_merge

dulwich/dulwich/tests/data/repos/simple_merge/.git

dulwich/dulwich/tests/data/repos/simple_merge/.git/HEAD

dulwich/dulwich/tests/data/repos/simple_merge/.git/index

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/0d

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/0d/89f20333fbb1d2f3a94da77f4981373d8f4310

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/1b

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/1b/6318f651a534b38f9c7aedeebbd56c1e896853

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/29

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/29/69be3e8ee1c0222396a5611407e4769f14e54b

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/4c

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/4c/ffe90e0a41ad3f5190079d7c8f036bde29cbe6

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/5d

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/5d/ac377bdded4c9aeb8dff595f0faeebcc8498cc

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/60

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/60/dacdc733de308bb77bb76ce0fb0f9b44c9769e

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/6f

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/6f/670c0fb53f9463760b7295fbb814e965fb20c8

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/70

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/70/c190eb48fa8bbb50ddc692a17b44cb781af7f6

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/90

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/90/182552c4a85a45ec2a835cadc3451bebdfe870

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/95

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/95/4a536f7819d40e6f637f849ee187dd10066349

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/ab

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/ab/64bbdcc51b170d21588e5c5d391ee5c0c96dfd

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d4

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d4/bdad6549dfedf25d3b89d21f506aff575b28a7

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d8

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d8/0c186a03f423a81b39df39dc87fd269736ca86

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/e6

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/e6/9de29bb2d1d6434b8b29ae775ad8c2e48c5391

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/info

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/pack

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs/heads

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs/heads/master

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs/tags

dulwich/dulwich/tests/data/repos/simple_merge/a

dulwich/dulwich/tests/data/repos/simple_merge/b

dulwich/dulwich/tests/data/repos/simple_merge/d

dulwich/dulwich/tests/data/repos/simple_merge/e

dulwich/dulwich/tests/data/trees

dulwich/dulwich/tests/data/trees/70c190eb48fa8bbb50ddc692a17b44cb781af7f6

dulwich/dulwich/tests/test_objects.py

dulwich/dulwich/tests/test_pack.py

dulwich/dulwich/tests/test_repository.py

dulwich/setup.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

remote.py

repository.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_ids.py

tests/test_repository.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/dirstate.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""DirState objects record the state of a directory and its bzr metadata.

Pseudo EBNF grammar for the disk format:

MINIKIND = "f" | "d" | "l";

NL = "\n";

NULL = "\0";

WHOLE NUMBER = {digit}, digit;

dirstate format = header line, full checksum, row count, parent details,

ghost_details, rows;

header line = "#bazaar dirstate flat format 1", NL;

full checksum = "adler32: ", ["-"], WHOLE NUMBER, NL;

row count = "num_entries: ", digit, NL;

parent_details = WHOLE NUMBER, NULL, NL; XXX: complete this line

ghost_details = WHOLE NUMBER, NULL, {GHOST_ID NULL}*, NL;

rows = dirname, NULL, basename, NULL, MINIKIND, NULL, fileid_utf8, NULL,

WHOLE NUMBER (* size *), NULL, packed stat, NULL, sha1|symlink target,

{PARENT ROW}

PARENT ROW = NULL, revision_utf8, NULL, MINIKIND, NULL, dirname, NULL,

basename, NULL, WHOLE NUMBER (* size *), NULL, "y" | "n", NULL,

SHA1

PARENT ROW's are emitted for every parent that is not in the ghosts details

line. That is, if the parents are foo, bar, baz, and the ghosts are bar, then

each row will have a PARENT ROW for foo and baz, but not for bar.

----

Design priorities:

1) Fast end to end use for bzr's top 5 use cases.

2) fall back current object model as needed.

3) scale usably to the largest trees known today - say 50K entries.

Locking:

Eventually reuse dirstate objects across locks IFF the dirstate file has not

been modified, but will require that we flush/ignore cached stat-hit data

because we won't want to restat all files on disk just because a lock was

acquired, yet we cannot trust the data after the previous lock was released.

Memory representation:

vector of all directories, and vector of the children ?

i.e.

root_row = (direntry for root, [parent_direntries_for_root]),

dirblocks = [

('', ['data for achild', 'data for bchild', 'data for cchild'])

('dir', ['achild', 'cchild', 'echild'])

]

- single bisect to find N subtrees from a path spec

- in-order for serialisation - this is 'dirblock' grouping.

- insertion of a file '/a' affects only the '/' child-vector, that is, to

insert 10K elements from scratch does not generate O(N^2) memmoves of a

single vector, rather each individual, which tends to be limited to a

manageable number. Will scale badly on trees with 10K entries in a

single directory. compare with Inventory.InventoryDirectory which has

a dictionary for the children. No bisect capability, can only probe for

exact matches, or grab all elements and sort.

- What's the risk of error here? Once we have the base format being processed

we should have a net win regardless of optimality. So we are going to

go with what seems reasonable.

open questions:

maybe we should do a test profile of these core structures - 10K simulated searches/lookups/etc?

Objects for each row?

The lifetime of Dirstate objects is currently per lock, but see above for

possible extensions. The lifetime of a row from a dirstate is expected to be

very short in the optimistic case: which we are optimising for. For instance,

subtree status will determine from analysis of the disk data what rows need to

be examined at all, and will be able to determine from a single row whether

that file has altered or not, so we are aiming to process tens of thousands of

entries each second within the dirstate context, before exposing anything to

the larger codebase. This suggests we want the time for a single file

comparison to be < 0.1 milliseconds. That would give us 10000 paths per second

processed, and to scale to 100 thousand we'll need another order of magnitude to do

that. Now, as the lifetime for all unchanged entries is the time to parse, stat

the file on disk, and then immediately discard, the overhead of object creation

becomes a significant cost.

Figures: Creating a tuple from 3 elements was profiled at 0.0625

microseconds, whereas creating an object which is subclassed from tuple was

0.500 microseconds, and creating an object with 3 elements and slots was 3

microseconds long. 0.1 milliseconds is 100 microseconds, and ideally we'll get

100

down to 10 microseconds for the total processing - having 33% of that be object

101

creation is a huge overhead. There is a potential cost in using tuples within

102

each row which is that the conditional code to do comparisons may be slower

103

than method invocation, but method invocation is known to be slow due to stack

104

frame creation, so avoiding methods in these tight inner loops is unfortunately

105

desirable. We can consider a pyrex version of this with objects in future if

106

desired.

107

108

"""

109

110

111

import base64

112

import bisect

113

import cStringIO

114

import os

115

import sha

116

import struct

117

import zlib

118

119

from bzrlib import (

120

errors,

121

trace,

122

)

123

import bzrlib.inventory

124

from bzrlib import osutils

125

from bzrlib.osutils import (

126

pathjoin,

127

sha_file,

128

sha_string,

129

walkdirs,

130

)

131

132

133

class DirState(object):
    """Record directory and metadata state for fast access.

    A dirstate is a specialised data structure for managing local working
    tree state information. It is not yet well defined whether it is
    platform specific, and if it is, how we detect/parameterise that.
    """

    # Translation tables between the in-memory kind names and the single
    # character 'minikind' that is written to disk.
    _kind_to_minikind = {
        'file': 'f',
        'directory': 'd',
        'symlink': 'l',
    }
    _minikind_to_kind = {
        'f': 'file',
        'd': 'directory',
        'l': 'symlink',
    }
    # TODO profile the performance gain of using int conversion rather than
    # a dict here. AND BLAME ANDREW IF it is faster.
    _to_yesno = {True: 'y', False: 'n'}

    # Values taken by _header_state and _dirblock_state.
    NOT_IN_MEMORY = 0
    IN_MEMORY_UNMODIFIED = 1
    IN_MEMORY_MODIFIED = 2

    # Placeholder packed stat used when no real stat value is available.
    NULLSTAT = 'x' * 32
    # Placeholder parent details: (revision, kind, dirname, basename, size,
    # executable, sha1) for a parent that does not have the file id.
    NULL_PARENT_ROW = ('', 'file', '/', 'RECYCLED.BIN', 0, False, '')

153

154

def __init__(self):

155

"""Create a DirState object.

156

157

Attributes of note:

158

159

:attr _root_row: The root row of the directory/file information,

160

- contains the path to / - '', ''

161

- kind of 'directory',

162

- the file id of the root in utf8

163

- size of 0

164

- a packed state

165

- and no sha information.

166

"""

167

# _header_state and _dirblock_state represent the current state

168

# of the dirstate metadata and the per-row data respectiely.

169

# NOT_IN_MEMORY indicates that no data is in memory

170

# IN_MEMORY_UNMODIFIED indicates that what we have in memory

171

# is the same as is on disk

172

# IN_MEMORY_MODIFIED indicates that we have a modified version

173

# of what is on disk.

174

# In future we will add more granularity, for instance _dirblock_state

175

# will probably support partially-in-memory as a separate variable,

176

# allowing for partially-in-memory unmodified and partially-in-memory

177

# modified states.

178

self._header_state = DirState.NOT_IN_MEMORY

179

self._dirblock_state = DirState.NOT_IN_MEMORY

180

self._dirblocks = []

181

self._ghosts = []

182

self._parents = []

183

self._root_row = None

184

self._state_file=None

185

186

def add(self, path, file_id, kind, stat, link_or_sha1):
    """Start tracking a path.

    :param path: The path within the dirstate - '' is the root, 'foo' is the
        path foo within the root, 'foo/bar' is the path bar within foo
        within the root.
    :param file_id: The file id of the path being added.
    :param kind: The kind of the path: 'file', 'directory' or 'symlink'.
    :param stat: The output of os.lstat for the path, or None when no stat
        is available (size 0 and NULLSTAT are recorded in that case).
    :param link_or_sha1: The sha value of the file, or the target of a
        symlink. '' for directories.
    :raises errors.InvalidNormalization: if the basename is not normalized
        and the normalized form cannot be accessed.
    :raises errors.NotVersionedError: if there is no block for the parent
        directory of path.
    :raises errors.BzrError: if kind is not one of the known kinds.
    """
    # Outline: find the block the path belongs in, find the location in
    # that block, check the basename is not already there, then insert.
    #------- copied from bzrlib.inventory.make_entry
    # --- normalized_filename wants a unicode basename only, so get one.
    parent_dir, name = os.path.split(path)
    # we dont import normalized_filename directly because we want to be
    # able to change the implementation at runtime for tests.
    normalized, accessible = osutils.normalized_filename(name)
    if normalized != name:
        if not accessible:
            raise errors.InvalidNormalization(path)
        name = normalized
    # now that we've normalised, we need the correct utf8 path and
    # dirname and basename elements. This single encode and split should be
    # faster than three separate encodes.
    utf8path = (parent_dir + '/' + name).strip('/').encode('utf8')
    dirname, basename = os.path.split(utf8path)
    self._read_dirblocks_if_needed()
    block_index = self._find_dirblock_index(dirname)
    if block_index < 0:
        # some parent path has not been added - its an error to add this
        # child
        raise errors.NotVersionedError(path, str(self))
    block = self._dirblocks[block_index][1]
    if stat is None:
        size, packed_stat = 0, DirState.NULLSTAT
    else:
        size, packed_stat = stat.st_size, pack_stat(stat)
    parent_info = self._empty_parent_info()
    # The last three fields of the row depend on the kind; directories
    # never record a size or a sha.
    if kind in ('file', 'symlink'):
        details = (size, packed_stat, link_or_sha1)
    elif kind == 'directory':
        details = (0, packed_stat, '')
    else:
        raise errors.BzrError('unknown kind %r' % kind)
    row_data = (
        (dirname, basename, kind, file_id.encode('utf8')) + details,
        parent_info)
    row_index = bisect.bisect_left(block, row_data)
    if row_index < len(block):
        assert block[row_index][0][1] != basename, \
            "basename %r already added" % basename
    block.insert(row_index, row_data)

    if kind == 'directory':
        # insert a new dirblock
        self._ensure_block(block_index, row_index, utf8path)
    self._dirblock_state = DirState.IN_MEMORY_MODIFIED

254

255

def add_deleted(self, fileid_utf8, parents):

256

"""Add fileid_utf8 with parents as deleted."""

257

self._read_dirblocks_if_needed()

258

new_row = self._make_deleted_row(fileid_utf8, parents)

259

block_index = self._find_dirblock_index(new_row[0][0])

260

if block_index < 0:

261

# no deleted block yet.

262

bisect.insort_left(self._dirblocks, (new_row[0][0], []))

263

block_index = self._find_dirblock_index(new_row[0][0])

264

block = self._dirblocks[block_index][1]

265

row_index = bisect.insort_left(block, new_row)

266

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

267

268

def _empty_parent_info(self):

269

return [DirState.NULL_PARENT_ROW] * (len(self._parents) -

270

len(self._ghosts))

271

272

def _ensure_block(self, parent_block_index, parent_row_index, dirname):

273

"""Enssure a block for dirname exists.

274

275

This function exists to let callers which know that there is a

276

directory dirname ensure that the block for it exists. This block can

277

fail to exist because of demand loading, or because a directory had no

278

children. In either case it is not an error. It is however an error to

279

call this if there is no parent entry for the directory, and thus the

280

function requires the coordinates of such an entry to be provided.

281

282

The root row is special cased and can be indicated with a parent block

283

and row index of -1

284

285

:param parent_block_index: The index of the block in which dirname's row

286

exists.

287

:param parent_row_index: The index in the parent block where the row

288

exists.

289

:param dirname: The utf8 dirname to ensure there is a block for.

290

:return: The index for the block.

291

"""

292

# the basename of the directory must be the end of its full name.

293

if not (parent_block_index == -1 and

294

parent_block_index == -1 and dirname == ''):

295

assert dirname.endswith(

296

self._dirblocks[parent_block_index][1][parent_row_index][0][1])

297

## In future, when doing partial parsing, this should load and

298

# populate the entire block.

299

index = bisect.bisect_left(self._dirblocks, (dirname, []))

300

if (index == len(self._dirblocks) or

301

self._dirblocks[index][0] != dirname):

302

self._dirblocks.insert(index, (dirname, []))

303

return index

304

305

def _find_dirblock_index(self, dirname):

306

"""Find the dirblock index for dirname.

307

308

:return: -1 if the dirname is not present, or the index in

309

self._dirblocks for it otherwise.

310

"""

311

block_index = bisect.bisect_left(self._dirblocks, (dirname, []))

312

if (block_index == len(self._dirblocks) or

313

self._dirblocks[block_index][0] != dirname):

314

return -1

315

return block_index

316

317

@staticmethod
def from_tree(tree, dir_state_filename):
    """Create a dirstate from a bzr Tree.

    The tree is read-locked for the duration of the call and is unlocked
    again even when building the dirstate fails. If building fails the
    newly opened state file is closed before the error propagates.

    :param tree: The tree which should provide parent information and
        inventory ids.
    :param dir_state_filename: The name of the file the dirstate is written
        to. It is opened with mode 'wb+'.
    :return: The new DirState, already saved, with its state file open.
    :raises ValueError: if the tree has more than 3 parents.
    :raises Exception: if a control directory ('.bzr', '.hg', 'CVS',
        '.svn', '_svn') is met while walking: skipping is not supported.
    """
    tree.lock_read()
    try:
        # XXX: aka the big ugly.
        result = DirState()
        result._state_file = open(dir_state_filename, 'wb+')
        try:
            parent_ids = tree.get_parent_ids()
            if len(parent_ids) > 3:
                raise ValueError('Cannot handle more than 3 parents')
            parent_trees = [
                tree.branch.repository.revision_tree(parent_id)
                for parent_id in parent_ids]

            # FIXME: is this utf8 safe?
            root_info = (
                '', '',  # No path
                'directory', tree.inventory.root.file_id.encode('utf8'),
                0,  # no point having a size for dirs.
                pack_stat(os.lstat(tree.basedir)),
                '',  # No sha
                )
            # Parent details are (revision, kind, dirname, basename, size,
            # executable, sha1). The size must be an integer: it is written
            # with str() and parsed back with int() when reloaded.
            root_parents = [
                (parent_tree.inventory.root.revision.encode('utf8'),
                 'directory', '', '', 0, False, '')
                for parent_tree in parent_trees]
            root_row = (root_info, root_parents)

            dirblocks = []
            for dirinfo, block in tree.walkdirs():
                # dirinfo is path, id
                block_row = []
                dirblocks.append((dirinfo[0], block_row))
                for relpath, name, kind, st, fileid, versionedkind in block:
                    if fileid is None:
                        # unversioned file, skip
                        continue
                    # TODO? factor out this loop body as a helper function ?
                    # Encode once; dirname and basename are utf8 from here.
                    dirname, basename = os.path.split(relpath.encode('utf8'))
                    if kind == 'file':
                        s = tree.get_file_sha1(fileid, relpath)
                    elif kind == 'directory':
                        if name in ('.bzr', '.hg', 'CVS', '.svn', '_svn'):
                            raise Exception('skipping dirs not supported yet')
                        # no sha value
                        s = ''
                    elif kind == 'symlink':
                        # sha value of the link target ?!
                        # NOTE(review): assumes the tree provides abspath()
                        # for tree-relative paths - confirm.
                        s = os.readlink(tree.abspath(relpath))
                    else:
                        s = None
                    parent_info = [
                        result._parent_info(parent_tree, fileid)
                        for parent_tree in parent_trees]
                    row_data = (dirname, basename, kind,
                                fileid.encode('utf8'), st.st_size,
                                pack_stat(st), s)
                    block_row.append((row_data, parent_info))

            result._set_data(parent_ids, root_row, dirblocks)
            result.save()
        except:
            # Do not leak the open file handle; the error is re-raised.
            result._state_file.close()
            raise
    finally:
        tree.unlock()
    return result

412

413

def get_ghosts(self):

414

"""Return a list of the parent tree revision ids that are ghosts."""

415

self._read_header_if_needed()

416

return self._ghosts

417

418

def get_lines(self):

419

"""Serialise the entire dirstate to a sequence of lines."""

420

if (self._header_state == DirState.IN_MEMORY_UNMODIFIED and

421

self._dirblock_state == DirState.IN_MEMORY_UNMODIFIED):

422

# read whats on disk.

423

self._state_file.seek(0)

424

return self._state_file.readlines()

425

lines = []

426

lines.append(self._get_parents_line(self.get_parent_ids()))

427

lines.append(self._get_ghosts_line(self._ghosts))

428

# append the root line which is special cased

429

lines.extend(map(self._row_to_line, self._iter_rows()))

430

return self._get_output_lines(lines)

431

432

def _get_ghosts_line(self, ghost_ids):

433

"""Create a line for the state file for ghost information."""

434

return '\0'.join([str(len(ghost_ids))] +

435

[g.encode('utf8') for g in ghost_ids])

436

437

def _get_parents_line(self, parent_ids):

438

"""Create a line for the state file for parents information."""

439

return '\0'.join([str(len(parent_ids))] +

440

[p.encode('utf8') for p in parent_ids])

441

442

def get_parent_ids(self):

443

"""Return a list of the parent tree ids for the directory state."""

444

self._read_header_if_needed()

445

return list(self._parents)

446

447

def _get_row(self, path_utf8):

448

"""Get the dirstate row for path.

449

450

:param path_utf8: An utf8 path to be looked up.

451

:return: The dirstate row tuple for path, or (None, None)

452

"""

453

self._read_dirblocks_if_needed()

454

if path_utf8 == '':

455

return self._root_row

456

dirname, basename = os.path.split(path_utf8)

457

block_index, row_index, dir_present, file_present = \

458

self._get_block_row_index(dirname, basename)

459

if not file_present:

460

return None, None

461

row = self._dirblocks[block_index][1][row_index]

462

assert row[0][3], 'unversioned row?!?!'

463

return row

464

465

def _get_block_row_index(self, dirname, basename):

466

"""Get the coordinates for a path in the state structure.

467

468

:param dirname: The utf8 dirname to lookup.

469

:param basename: The utf8 basename to lookup.

470

:return: A tuple describing where the path is located, or should be

471

inserted. The tuple contains four fields: the block index, the row

472

index, anda two booleans are True when the directory is present, and

473

when the entire path is present. There is no guarantee that either

474

coordinate is currently reachable unless the found field for it is

475

True. For instance, a directory not present in the state may be

476

returned with a value one greater than the current highest block

477

offset. The directory present field will always be True when the

478

path present field is True.

479

"""

480

assert not (dirname == '' and basename == ''), 'blackhole lookup error'

481

self._read_dirblocks_if_needed()

482

block_index = bisect.bisect_left(self._dirblocks, (dirname, []))

483

if (block_index == len(self._dirblocks) or

484

self._dirblocks[block_index][0] != dirname):

485

# no such directory - return the dir index and 0 for the row.

486

return block_index, 0, False, False

487

block = self._dirblocks[block_index][1] # access the rows only

488

search = ((dirname, basename), [])

489

row_index = bisect.bisect_left(block, search)

490

if row_index == len(block) or block[row_index][0][1] != basename:

491

return block_index, row_index, True, False

492

return block_index, row_index, True, True

493

494

@staticmethod
def initialize(path):
    """Create a new dirstate on path.

    The new dirstate will be an empty tree - that is it has no parents,
    and only a root node - which has id ROOT_ID.

    :param path: The name of the file for the dirstate.
    :return: A DirState object.
    """
    # A fresh DirState gets a new empty file at path as its _state_file,
    # is loaded via _set_data() with the stock empty dirstate information
    # (a root with ROOT_ID, no children, no parents) and is then saved so
    # that this data persists.
    state = DirState()
    state._state_file = open(path, 'wb+')
    # a new root directory, with a pack_stat (the x's) that is just noise
    # and will never match the output of base64 encode.
    root_row = (
        ('', '', 'directory', bzrlib.inventory.ROOT_ID, 0,
         DirState.NULLSTAT, ''),
        [],  # no parents
        )
    # the single dirblock is the root dir contents - no entries.
    state._set_data([], root_row, [('', [])])
    try:
        state.save()
    except:
        # close the file we opened before passing the error on.
        state._state_file.close()
        raise
    return state

525

526

def _iter_rows(self):

527

"""Iterate over all the row data in the dirstate.

528

529

Each yelt item is a tuple of (row_data, parent_data_list).

530

"""

531

self._read_dirblocks_if_needed()

532

yield self._root_row

533

for directory in self._dirblocks:

534

for row in directory[1]:

535

yield row

536

537

def _get_output_lines(self, lines):
    """Format lines for final output.

    The result is the format marker line, an adler32 checksum line, a
    num_entries line and finally the inventory text, which is the given
    lines (plus a trailing empty entry) joined with '\\0\\n\\0'.

    :param lines: A sequence of lines containing the parents list and the
        path lines. It is not modified.
    :return: A list of four strings ready to be written to the state file.
    """
    # Work on a copy so the caller's list does not grow as a side effect.
    body_lines = list(lines)
    body_lines.append('')  # a final newline
    inventory_text = '\0\n\0'.join(body_lines)
    # -3, 1 for num parents, 1 for ghosts, 1 for final newline
    num_entries = len(body_lines) - 3
    return [
        '#bazaar dirstate flat format 1\n',
        'adler32: %s\n' % (zlib.adler32(inventory_text),),
        'num_entries: %s\n' % (num_entries,),
        inventory_text,
    ]

552

553

def _make_deleted_row(self, fileid_utf8, parents):

554

"""Return a deleted for for fileid_utf8."""

555

return ('/', 'RECYCLED.BIN', 'file', fileid_utf8, 0, DirState.NULLSTAT,

556

''), parents

557

558

@staticmethod

559

def on_file(path):

560

"""Construct a DirState on the file at path path."""

561

result = DirState()

562

result._state_file = open(path, 'rb+')

563

return result

564

565

def _parent_info(self, parent_tree, fileid):

566

"""Generate the parent information for file_id in parent_tree."""

567

# FIXME: This is probably expensive - we encode the path that in the

568

# common case will be the same across all parents, twice.

569

# also, id2path is slow in inventory, and we should make that fast.

570

try:

571

parent_entry = parent_tree.inventory[fileid]

572

except errors.NoSuchId:

573

# this parent does not have fileid - return a bogus entry, which

574

# will be filtered out on iteration etc.

575

# an empty revision id is bogus and safe to put on disk

576

# we make it be a 'file', just because. We give it the

577

# deleted file path dirname and basename, 0 size, not executable

578

# and no sha1.

579

return DirState.NULL_PARENT_ROW

580

parent_path = parent_tree.inventory.id2path(fileid)

581

dirname, basename = os.path.split(parent_path.encode('utf8'))

582

return (parent_entry.revision.encode('utf8'),

583

parent_entry.kind,

584

# FIXME: set these from the parent

585

dirname, basename,

586

parent_entry.text_size or 0,

587

parent_entry.executable,

588

parent_entry.text_sha1 or '',

589

)

590

591

def _read_dirblocks_if_needed(self):

592

"""Read in all the dirblocks from the file if they are not in memory."""

593

self._read_header_if_needed()

594

if self._dirblock_state == DirState.NOT_IN_MEMORY:

595

# the _state_file pointer will be positioned at the start of the

596

# dirblocks.

597

text = self._state_file.read()

598

# TODO: check the adler checksums. adler_measured = zlib.adler32(text)

599

600

fields = text.split('\0')

601

# Remove the last blank entry

602

trailing = fields.pop()

603

assert trailing == ''

604

# consider turning fields into a tuple.

605

606

# skip the first field which is the trailing null from the header.

607

cur = 1

608

# Each line now has an extra '\n' field which is not used

609

# so we just skip over it

610

# number of fields per dir_entry

611

# + number of fields per parent_entry

612

# + newline

613

num_present_parents = len(self._parents) - len(self._ghosts)

614

entry_size = 7 + (7 * (num_present_parents)) + 1

615

expected_field_count = entry_size * self._num_entries

616

if len(fields) - cur > expected_field_count:

617

fields = fields[:expected_field_count + cur]

618

trace.mutter('Unexpectedly long dirstate field count!')

619

print "XXX: incorrectly truncated dirstate file bug triggered."

620

field_count = len(fields)

621

# this checks our adjustment, and also catches file too short.

622

assert field_count - cur == expected_field_count, \

623

'field count incorrect %s != %s, entry_size=%s, '\

624

'num_entries=%s fields=%r' % (

625

field_count - cur, expected_field_count, entry_size,

626

self._num_entries, fields)

627

628

# Fast path the case where there are 1 or 2 parents

629

if num_present_parents == 0:

630

entries = [(fields[pos:pos+7], []) for pos in xrange(cur, field_count, entry_size)]

631

elif num_present_parents == 1:

632

entries = [(fields[pos:pos+7], [fields[pos+7:pos+14],])

633

for pos in xrange(cur, field_count, entry_size)]

634

elif num_present_parents == 2:

635

entries = [(fields[pos:pos+7], [

636

fields[pos+7:pos+14],

637

fields[pos+14:pos+21],])

638

for pos in xrange(cur, field_count, entry_size)]

639

else:

640

entries = [(

641

fields[pos:pos+7],

642

tuple([fields[chunk:chunk+7] for

643

chunk in xrange(pos + 7, pos+entry_size-1, 7)]))

644

for pos in xrange(cur, field_count, entry_size)

645

]

646

647

assert len(entries) == self._num_entries, '%s != %s entries' % (len(entries),

648

self._num_entries)

649

650

def _line_to_row(line):

651

"""Convert a freshly read line's size and minikind for use."""

652

# convert the minikind to kind

653

line[0][2] = self._minikind_to_kind[line[0][2]]

654

# convert the size to an int

655

line[0][4] = int(line[0][4])

656

for parent in line[1]:

657

parent[1] = self._minikind_to_kind[parent[1]]

658

parent[4] = int(parent[4])

659

parent[5] = parent[5] == 'y'

660

return tuple(line[0]), map(tuple, line[1])

661

new_rows = map(_line_to_row, entries)

662

self._rows_to_current_state(new_rows)

663

self._dirblock_state = DirState.IN_MEMORY_UNMODIFIED

664

665

def _read_header(self):

666

"""This reads in the metadata header, and the parent ids.

667

668

After reading in, the file should be positioned at the null

669

just before the start of the first record in the file.

670

671

:return: (expected adler checksum, number of entries, parent list)

672

"""

673

self._read_prelude()

674

parent_line = self._state_file.readline()

675

info = parent_line.split('\0')

676

num_parents = int(info[0])

677

assert num_parents == len(info)-2, 'incorrect parent info line'

678

self._parents = [p.decode('utf8') for p in info[1:-1]]

679

680

ghost_line = self._state_file.readline()

681

info = ghost_line.split('\0')

682

num_ghosts = int(info[1])

683

assert num_ghosts == len(info)-3, 'incorrect ghost info line'

684

self._ghosts = [p.decode('utf8') for p in info[2:-1]]

685

self._header_state = DirState.IN_MEMORY_UNMODIFIED

686

687

def _read_header_if_needed(self):

688

"""Read the header of the dirstate file if needed."""

689

if self._header_state == DirState.NOT_IN_MEMORY:

690

self._read_header()

691

692

def _read_prelude(self):

693

"""Read in the prelude header of the dirstate file

694

695

This only reads in the stuff that is not connected to the adler

696

checksum. The position will be correct to read in the rest of

697

the file and check the checksum after this point.

698

The next entry in the file should be the number of parents,

699

and their ids. Followed by a newline.

700

"""

701

header = self._state_file.readline()

702

assert header == '#bazaar dirstate flat format 1\n', \

703

'invalid header line: %r' % (header,)

704

adler_line = self._state_file.readline()

705

assert adler_line.startswith('adler32: '), 'missing adler32 checksum'

706

self.adler_expected = int(adler_line[len('adler32: '):-1])

707

num_entries_line = self._state_file.readline()

708

assert num_entries_line.startswith('num_entries: '), 'missing num_entries line'

709

self._num_entries = int(num_entries_line[len('num_entries: '):-1])

710

711

def _row_to_line(self, row):

712

"""Serialize row to a NULL delimited line ready for _get_output_lines.

713

714

:param row: A row_tuple as defined in the module docstring.

715

"""

716

entire_row = list(row[0])

717

for parent_number, parent_data in enumerate(row[1]):

718

# (revision, kind, dirname, basename, size, executable_bool, sha1)

719

entire_row.extend(parent_data)

720

# minikind conversion of the parent

721

parent_offset = 7 + parent_number * 7

722

entire_row[parent_offset + 1] = DirState._kind_to_minikind[parent_data[1]]

723

entire_row[parent_offset + 4] = str(parent_data[4])

724

entire_row[parent_offset + 5] = DirState._to_yesno[parent_data[5]]

725

# conversion from memory to disk-ready format:

726

# minikind conversion of the current row type.

727

entire_row[2] = DirState._kind_to_minikind[entire_row[2]]

728

entire_row[4] = str(entire_row[4])

729

# minikind of parents

730

return '\0'.join(entire_row)

731

732

def _rows_to_current_state(self, new_rows):

733

"""Load new_rows into self._root_row and self.dirblocks.

734

735

Process new_rows into the current state object, making them the active

736

state.

737

738

:param new_rows: A sorted list of rows. This function does not sort

739

to prevent unneeded overhead when callers have a sorted list

740

already.

741

:return: Nothing.

742

"""

743

assert new_rows[0][0][0:2] == ('', ''), \

744

"Incorrect root row %r" % new_rows[0][0]

745

self._root_row = new_rows[0]

746

self._dirblocks = [('', [])]

747

for row in new_rows[1:]:

748

if row[0][0] != self._dirblocks[-1][0]:

749

# new block

750

self._dirblocks.append((row[0][0], []))

751

# append the row to the current block

752

self._dirblocks[-1][1].append(row)

753

754

def save(self):

755

"""Save any pending changes created during this session.

756

757

We reuse the existing file, because that prevents race conditions with

758

file creation, and we expect to be using oslocks on it in the near

759

future to prevent concurrent modification and reads - because dirstates

760

incremental data aggretation is not compatible with reading a modified

761

file, and replacing a file in use by another process is impossible on

762

windows.

763

764

A dirstate in read only mode should be smart enough though to validate

765

that the file has not changed, and otherwise discard its cache and

766

start over, to allow for fine grained read lock duration, so 'status'

767

wont block 'commit' - for example.

768

"""

769

if (self._header_state == DirState.IN_MEMORY_MODIFIED or

770

self._dirblock_state == DirState.IN_MEMORY_MODIFIED):

771

self._state_file.seek(0)

772

self._state_file.writelines(self.get_lines())

773

self._state_file.truncate()

774

self._state_file.flush()

775

self._header_state = DirState.IN_MEMORY_UNMODIFIED

776

self._dirblock_state = DirState.IN_MEMORY_UNMODIFIED

777

778

def _set_data(self, parent_ids, root_row, dirblocks):

779

"""Set the full dirstate data in memory.

780

781

This is an internal function used to completely replace the objects

782

in memory state. It puts the dirstate into state 'full-dirty'.

783

784

:param parent_ids: A list of parent tree revision ids.

785

:param root_row: The root row - a tuple of the root direntry and the

786

list of matching direntries from the parent_ids trees.

787

:param dirblocks: A list containing one tuple for each directory in the

788

tree. Each tuple contains the directory path and a list of

789

row data in the same format as root_row.

790

"""

791

# our memory copy is now authoritative.

792

self._dirblocks = dirblocks

793

self._root_row = root_row

794

self._header_state = DirState.IN_MEMORY_MODIFIED

795

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

796

self._parents = list(parent_ids)

797

798

def set_path_id(self, path, new_id):

799

"""Change the id of path to new_id.

800

801

:param path: The path inside the tree to set - '' is the root, 'foo'

802

is the path foo in the root.

803

:param new_id: The new id to assign to the path. If unicode, it will

804

be encoded to utf8. In future this will be deprecated: avoid using

805

unicode ids if possible.

806

"""

807

# TODO: start warning here.

808

if new_id.__class__ == unicode:

809

new_id = new_id.encode('utf8')

810

self._read_dirblocks_if_needed()

811

if len(path):

812

import pdb;pdb.set_trace()

813

# logic not written

814

raise NotImplementedError(self.set_path_id)

815

# TODO: check new id is unique

816

if new_id == self._root_row[0][3]:

817

# the root id is unchanged

818

return

819

root_info, root_parents = self._root_row

820

if len(root_parents):

821

self.add_deleted(root_info[3], root_parents)

822

self._root_row = ((root_info[0:3] + (new_id, ) + root_info[4:7]),

823

self._empty_parent_info())

824

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

825

826

def set_parent_trees(self, trees, ghosts):

827

"""Set the parent trees for the dirstate.

828

829

:param trees: A list of revision_id, tree tuples. tree must be provided

830

even if the revision_id refers to a ghost: supply an empty tree in

831

this case.

832

:param ghosts: A list of the revision_ids that are ghosts at the time

833

of setting.

834

"""

835

# TODO: generate a list of parent indexes to preserve to save

836

# processing specific parent trees. In the common case one tree will

837

# be preserved - the left most parent.

838

# TODO: if the parent tree is a dirstate, we might want to walk them

839

# all by path in parallel for 'optimal' common-case performance.

840

# generate new root row.

841

self._read_dirblocks_if_needed()

842

old_root = self._root_row

843

root_info = self._root_row[0]

844

new_parent_count = len(trees)

845

# sketch: loop over all rows in the dirstate, cherry picking

846

# entries from the parent trees, if they are not ghosts.

847

# after we finish walking the dirstate, all entries not in the dirstate

848

# are deletes, so we want to append them to the end as per the design

849

# discussions. So do a set difference on ids with the parents to

850

# get deletes, and add them to the end.

851

new_rows = []

852

# skip ghost trees, as they dont get represented.

853

parent_trees = [tree for rev_id, tree in trees if rev_id not in ghosts]

854

parent_tree_count = len(parent_trees)

855

# loop over existing entries in the dirstate.

856

checked_ids = set()

857

for entry, old_parents in self._iter_rows():

858

file_id = entry[3]

859

checked_ids.add(file_id)

860

new_parents = [None] * parent_tree_count

861

for position, parent_tree in enumerate(parent_trees):

862

# revision_utf8, KIND, dirname, basename, size, executable, sha

863

new_parents[position] = self._parent_info(parent_tree, file_id)

864

assert None not in new_parents

865

new_rows.append((entry, new_parents))

866

# get additional ids that are present in parents and not in this tree.

867

deleted_ids = set()

868

for tree in parent_trees:

869

deleted_ids.update(set(tree.inventory._byid).difference(checked_ids))

870

# add the deleted ids to the dirstate. deleted files are represented as

871

# a file with dirname '', basename ''

872

for file_id in deleted_ids:

873

# add these ids to the deleted block

874

checked_ids.add(file_id)

875

# deleted items have a synthetic entry.

876

entry = ('/', 'RECYCLED.BIN', 'file', file_id.encode('utf8'), 0,

877

DirState.NULLSTAT, '')

878

new_parents = [None] * parent_tree_count

879

for position, parent_tree in enumerate(parent_trees):

880

# revision_utf8, KIND, dirname, basename, size, executable, sha

881

new_parents[position] = self._parent_info(parent_tree, file_id)

882

assert None not in new_parents

883

new_rows.append((entry, new_parents))

884

885

# sort all the rows

886

new_rows = sorted(new_rows)

887

self._rows_to_current_state(new_rows)

888

self._parents = [rev_id for rev_id, tree in trees]

889

self._ghosts = list(ghosts)

890

self._header_state = DirState.IN_MEMORY_MODIFIED

891

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

892

893

def set_state_from_inventory(self, new_inv):
    """Replace the current tree state with the contents of new_inv.

    Parent details already recorded for a file id are carried over to the
    rebuilt row for that id. Ids that are no longer in new_inv but still
    have parent details are kept as synthetic "deleted" rows.

    :param new_inv: The inventory object to set current state from.
    """
    self._read_dirblocks_if_needed()
    # Index the existing parent details by file id (element 3 of a row).
    parents_by_id = dict(
        (old_row[3], old_parents)
        for old_row, old_parents in self._iter_rows())

    present_parent_count = len(self._parents) - len(self._ghosts)

    # Walk the new inventory in directory order, reusing the parent details
    # recorded for each id and consuming them from the index as we go.
    rebuilt = []
    for path, inv_entry in new_inv.iter_entries_by_dir():
        dirname, basename = os.path.split(path.encode('utf8'))
        kind = inv_entry.kind
        fileid_utf8 = inv_entry.file_id.encode('utf8')
        # Anything that is neither a file nor a symlink has no size and no
        # fingerprint.
        size, sha1 = 0, ''
        if kind == 'file':
            size = inv_entry.text_size or 0
            sha1 = inv_entry.text_sha1 or ''
        elif kind == 'symlink':
            # symlinks store their target in the sha1 slot.
            sha1 = (inv_entry.symlink_target or '').encode('utf8')
        if fileid_utf8 in parents_by_id:
            parent_details = parents_by_id.pop(fileid_utf8)
        else:
            # id is new to the dirstate: one null row per present parent.
            parent_details = (
                [DirState.NULL_PARENT_ROW] * present_parent_count)
        current = (dirname, basename, kind, fileid_utf8, size,
                   DirState.NULLSTAT, sha1)
        rebuilt.append((current, parent_details))

    # Whatever is left in the index was not in new_inv. Keep those ids that
    # still have parent details, using a synthetic entry for the current
    # tree; ids with no parent details are dropped.
    for fileid_utf8, parent_details in parents_by_id.items():
        if parent_details:
            placeholder = ('/', 'RECYCLED.BIN', 'file', fileid_utf8, 0,
                           DirState.NULLSTAT, '')
            rebuilt.append((placeholder, parent_details))

    # The leftover rows were appended in arbitrary order, so sort everything.
    rebuilt.sort()
    self._rows_to_current_state(rebuilt)
    self._dirblock_state = DirState.IN_MEMORY_MODIFIED

943

944

945

def pack_stat(st,
              _encode=(getattr(base64, 'encodebytes', None)
                       or base64.encodestring),
              _pack=struct.pack):
    """Convert stat values into a packed representation.

    The size, mtime, ctime, device, inode and mode of ``st`` are packed as
    six big-endian 32-bit integers and the 24 resulting bytes are base64
    encoded.

    Each field is reduced to its low 32 bits before packing, and the
    timestamps are truncated to whole seconds. This keeps files of 2GiB or
    more, wide inode/device numbers and float timestamps from raising
    struct.error. For values that already fit in a signed 32-bit integer
    the output is byte-for-byte the same as packing with '>llllll'.

    :param st: An object with st_size, st_mtime, st_ctime, st_dev, st_ino
        and st_mode attributes, such as a stat result.
    :param _encode: base64 encoder, bound as a default argument. It is
        expected to append a single trailing newline. Defaults to
        base64.encodebytes where available, otherwise the older
        base64.encodestring alias.
    :param _pack: struct.pack, bound as a default argument.
    :return: The base64 encoding of the packed fields, without the
        trailing newline.
    """
    # jam 20060614 it isn't really worth removing more entries if we
    # are going to leave it in packed form.
    # With only st_mtime and st_mode filesize is 5.5M and read time is 275ms
    # With all entries filesize is 5.9M and read time is maybe 280ms
    # well within the noise margin

    # Keep only the low 32 bits of every field so that packing cannot
    # overflow; two's complement makes this identical to signed packing
    # for values that were previously accepted.
    mask = 0xFFFFFFFF
    packed = _pack('>LLLLLL',
                   st.st_size & mask,
                   int(st.st_mtime) & mask,
                   int(st.st_ctime) & mask,
                   st.st_dev & mask,
                   st.st_ino & mask,
                   st.st_mode & mask)
    # the base64 encoder always adds a final newline, so strip it off
    return _encode(packed)[:-1]

957

Older »