/brz/remove-bazaar : revision 5807.4.6

To get this branch, use:

bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/dirstate.py

Committer: John Arbash Meinel
Date: 2011-04-22 14:12:22 UTC
mfrom: (5809 +trunk)
mto: This revision was merged to the branch mainline in revision 5836.
Revision ID: john@arbash-meinel.com-20110422141222-nx2j0hbkihcb8j16

Merge newer bzr.dev and resolve conflicts.
Try to write some documentation about how the _dirblock_state works.
Fix up the tests so that they pass again.

files added:
.bzrignore

.rsyncexclude

.testr.conf

BRANCH.TODO

COPYING.txt

INSTALL

MANIFEST.in

Makefile

NEWS

README

README_BDIST_RPM

TODO

apport

apport/README

apport/bzr-crashdb.conf

apport/source_bzr.py

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_import_c_api.h

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/cethread.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cleanup.py

bzrlib/cmd_test_script.py

bzrlib/cmd_version_info.py

bzrlib/cmdline.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/controldir.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/doc_generate/builders

bzrlib/doc_generate/builders/__init__.py

bzrlib/doc_generate/builders/texinfo.py

bzrlib/doc_generate/conf.py

bzrlib/doc_generate/writers

bzrlib/doc_generate/writers/__init__.py

bzrlib/doc_generate/writers/texinfo.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflict-types.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/location-alias.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/help_topics/es

bzrlib/help_topics/es/conflict-types.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/library_state.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/mergetools.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/bash_completion

bzrlib/plugins/bash_completion/README.txt

bzrlib/plugins/bash_completion/__init__.py

bzrlib/plugins/bash_completion/bashcomp.py

bzrlib/plugins/bash_completion/tests

bzrlib/plugins/bash_completion/tests/__init__.py

bzrlib/plugins/bash_completion/tests/test_bashcomp.py

bzrlib/plugins/changelog_merge

bzrlib/plugins/changelog_merge/__init__.py

bzrlib/plugins/changelog_merge/changelog_merge.py

bzrlib/plugins/changelog_merge/tests

bzrlib/plugins/changelog_merge/tests/__init__.py

bzrlib/plugins/changelog_merge/tests/test_changelog_merge.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_propose.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_api.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/plugins/news_merge

bzrlib/plugins/news_merge/README

bzrlib/plugins/news_merge/__init__.py

bzrlib/plugins/news_merge/news_merge.py

bzrlib/plugins/news_merge/parser.py

bzrlib/plugins/news_merge/tests

bzrlib/plugins/news_merge/tests/__init__.py

bzrlib/plugins/news_merge/tests/test_news_merge.py

bzrlib/plugins/weave_fmt

bzrlib/plugins/weave_fmt/__init__.py

bzrlib/plugins/weave_fmt/branch.py

bzrlib/plugins/weave_fmt/bzrdir.py

bzrlib/plugins/weave_fmt/repository.py

bzrlib/plugins/weave_fmt/test_bzrdir.py

bzrlib/plugins/weave_fmt/test_repository.py

bzrlib/plugins/weave_fmt/test_workingtree.py

bzrlib/plugins/weave_fmt/tests

bzrlib/plugins/weave_fmt/workingtree.py

bzrlib/plugins/weave_fmt/xml4.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/pyutils.py

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/recordcounter.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitpack_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/static_tuple.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_config.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_deleted.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_lookup_revision.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_repair_workingtree.py

bzrlib/tests/blackbox/test_resolve.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_rmbranch.py

bzrlib/tests/blackbox/test_script.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_revert.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/doc_generate

bzrlib/tests/doc_generate/__init__.py

bzrlib/tests/doc_generate/builders

bzrlib/tests/doc_generate/builders/__init__.py

bzrlib/tests/doc_generate/builders/test_texinfo.py

bzrlib/tests/doc_generate/writers

bzrlib/tests/doc_generate/writers/__init__.py

bzrlib/tests/doc_generate/writers/test_texinfo.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/fixtures.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/matchers.py

bzrlib/tests/per_branch

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_config.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_controldir

bzrlib/tests/per_controldir/__init__.py

bzrlib/tests/per_controldir/test_controldir.py

bzrlib/tests/per_controldir/test_format.py

bzrlib/tests/per_controldir/test_push.py

bzrlib/tests/per_controldir_colo

bzrlib/tests/per_controldir_colo/__init__.py

bzrlib/tests/per_controldir_colo/test_supported.py

bzrlib/tests/per_controldir_colo/test_unsupported.py

bzrlib/tests/per_foreign_vcs

bzrlib/tests/per_foreign_vcs/__init__.py

bzrlib/tests/per_foreign_vcs/test_branch.py

bzrlib/tests/per_foreign_vcs/test_repository.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_copy_content_into.py

bzrlib/tests/per_interbranch/test_fetch.py

bzrlib/tests/per_interbranch/test_get.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_merger.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_commit_with_stacking.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_graph.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_repository_vf

bzrlib/tests/per_repository_vf/__init__.py

bzrlib/tests/per_repository_vf/helpers.py

bzrlib/tests/per_repository_vf/test_check.py

bzrlib/tests/per_repository_vf/test_check_reconcile.py

bzrlib/tests/per_repository_vf/test_reconcile.py

bzrlib/tests/per_repository_vf/test_repository.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_is_executable.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_locking.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_uifactory

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_check_state.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_symlinks.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/scenarios.py

bzrlib/tests/script.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__bencode.py

bzrlib/tests/test__btree_serializer.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_cethread.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_cleanup.py

bzrlib/tests/test_cmdline.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_controldir.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_fixtures.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_import_tariff.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_library_state.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_matchers.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_mergetools.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/binary-after-normal.patch

bzrlib/tests/test_patches_data/binary.patch

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_pyutils.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_scenarios.py

bzrlib/tests/test_script.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_server.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_test_server.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_treeshape.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/testui.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/gio_transport.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/pathfilter.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/_bencode_py.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/bash

contrib/bash/bzr

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/create_bzr_rollup.py

contrib/debian

contrib/debian/default

contrib/debian/init.d

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/README

doc/Bazaar-Logo-For-Manuals.png

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr-doc.css

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/code-review.txt

doc/developers/code-style.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/conf.py

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/contribution-quickstart.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/documenting-changes.txt

doc/developers/ec2.txt

doc/developers/fetch.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/implementation-notes.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index-plain.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/miscellaneous-notes.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/principles.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/specifications.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/transports.txt

doc/developers/ui.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/developers/win32_build_setup.txt

doc/developers/xdg_config_spec.txt

doc/en

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_static/en/Makefile

doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/_static/en/bzr-en-quick-reference.png

doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide

doc/en/admin-guide/advanced.txt

doc/en/admin-guide/backup.txt

doc/en/admin-guide/code-browsing.txt

doc/en/admin-guide/hooks-plugins.txt

doc/en/admin-guide/index-plain.txt

doc/en/admin-guide/index.txt

doc/en/admin-guide/integration.txt

doc/en/admin-guide/introduction.txt

doc/en/admin-guide/migration.txt

doc/en/admin-guide/other-setups.txt

doc/en/admin-guide/security.txt

doc/en/admin-guide/simple-setups.txt

doc/en/admin-guide/upgrade.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/release-notes/bzr-0.1.txt

doc/en/release-notes/bzr-0.10.txt

doc/en/release-notes/bzr-0.11.txt

doc/en/release-notes/bzr-0.12.txt

doc/en/release-notes/bzr-0.13.txt

doc/en/release-notes/bzr-0.14.txt

doc/en/release-notes/bzr-0.15.txt

doc/en/release-notes/bzr-0.16.txt

doc/en/release-notes/bzr-0.17.txt

doc/en/release-notes/bzr-0.18.txt

doc/en/release-notes/bzr-0.6.txt

doc/en/release-notes/bzr-0.7.txt

doc/en/release-notes/bzr-0.8.txt

doc/en/release-notes/bzr-0.9.txt

doc/en/release-notes/bzr-0.90.txt

doc/en/release-notes/bzr-0.91.txt

doc/en/release-notes/bzr-0.92.txt

doc/en/release-notes/bzr-1.0.txt

doc/en/release-notes/bzr-1.1.txt

doc/en/release-notes/bzr-1.10.txt

doc/en/release-notes/bzr-1.11.txt

doc/en/release-notes/bzr-1.12.txt

doc/en/release-notes/bzr-1.13.txt

doc/en/release-notes/bzr-1.14.txt

doc/en/release-notes/bzr-1.15.txt

doc/en/release-notes/bzr-1.16.txt

doc/en/release-notes/bzr-1.17.txt

doc/en/release-notes/bzr-1.18.txt

doc/en/release-notes/bzr-1.2.txt

doc/en/release-notes/bzr-1.3.txt

doc/en/release-notes/bzr-1.4.txt

doc/en/release-notes/bzr-1.5.txt

doc/en/release-notes/bzr-1.6.txt

doc/en/release-notes/bzr-1.7.txt

doc/en/release-notes/bzr-1.8.txt

doc/en/release-notes/bzr-1.9.txt

doc/en/release-notes/bzr-2.0.txt

doc/en/release-notes/bzr-2.1.txt

doc/en/release-notes/bzr-2.2.txt

doc/en/release-notes/bzr-2.3.txt

doc/en/release-notes/bzr-2.4.txt

doc/en/release-notes/release-template.txt

doc/en/release-notes/series-template.txt

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/en/whats-new

doc/en/whats-new/whats-new-in-2.1.txt

doc/en/whats-new/whats-new-in-2.2.txt

doc/en/whats-new/whats-new-in-2.3.txt

doc/en/whats-new/whats-new-in-2.4.txt

doc/es

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/Makefile

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/index.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/index.txt

doc/es/user-guide

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ja.txt

doc/index.ru.txt

doc/index.txt

doc/ja

doc/ja/_static

doc/ja/_static/bzr icon 16.png

doc/ja/_static/bzr.ico

doc/ja/_templates

doc/ja/conf.py

doc/ja/index.txt

doc/ja/mini-tutorial

doc/ja/mini-tutorial/index.txt

doc/ja/tutorials

doc/ja/tutorials/centralized_workflow.txt

doc/ja/tutorials/index.txt

doc/ja/tutorials/tutorial.txt

doc/ja/tutorials/using_bazaar_with_launchpad.txt

doc/ja/upgrade-guide

doc/ja/upgrade-guide/data_migration.txt

doc/ja/upgrade-guide/index.txt

doc/ja/upgrade-guide/overview.txt

doc/ja/upgrade-guide/tips_and_tricks.txt

doc/ja/user-guide

doc/ja/user-guide/adv_merging.txt

doc/ja/user-guide/annotating_changes.txt

doc/ja/user-guide/bazaar_workflows.txt

doc/ja/user-guide/branching_a_project.txt

doc/ja/user-guide/browsing_history.txt

doc/ja/user-guide/bug_trackers.txt

doc/ja/user-guide/bzrtools_plugin.txt

doc/ja/user-guide/central_intro.txt

doc/ja/user-guide/configuring_bazaar.txt

doc/ja/user-guide/controlling_registration.txt

doc/ja/user-guide/core_concepts.txt

doc/ja/user-guide/distributed_intro.txt

doc/ja/user-guide/entering_commands.txt

doc/ja/user-guide/filtered_views.txt

doc/ja/user-guide/getting_help.txt

doc/ja/user-guide/hooks.txt

doc/ja/user-guide/http_smart_server.txt

doc/ja/user-guide/images

doc/ja/user-guide/images/workflows_centralized.png

doc/ja/user-guide/images/workflows_centralized.svg

doc/ja/user-guide/images/workflows_gatekeeper.png

doc/ja/user-guide/images/workflows_gatekeeper.svg

doc/ja/user-guide/images/workflows_localcommit.png

doc/ja/user-guide/images/workflows_localcommit.svg

doc/ja/user-guide/images/workflows_peer.png

doc/ja/user-guide/images/workflows_peer.svg

doc/ja/user-guide/images/workflows_pqm.png

doc/ja/user-guide/images/workflows_pqm.svg

doc/ja/user-guide/images/workflows_shared.png

doc/ja/user-guide/images/workflows_shared.svg

doc/ja/user-guide/images/workflows_single.png

doc/ja/user-guide/images/workflows_single.svg

doc/ja/user-guide/index.txt

doc/ja/user-guide/installing_bazaar.txt

doc/ja/user-guide/introducing_bazaar.txt

doc/ja/user-guide/merging_changes.txt

doc/ja/user-guide/organizing_branches.txt

doc/ja/user-guide/organizing_your_workspace.txt

doc/ja/user-guide/part2_intro.txt

doc/ja/user-guide/partner_intro.txt

doc/ja/user-guide/plugins.txt

doc/ja/user-guide/publishing_a_branch.txt

doc/ja/user-guide/recording_changes.txt

doc/ja/user-guide/releasing_a_project.txt

doc/ja/user-guide/resolving_conflicts.txt

doc/ja/user-guide/reusing_a_checkout.txt

doc/ja/user-guide/reviewing_changes.txt

doc/ja/user-guide/sending_changes.txt

doc/ja/user-guide/server.txt

doc/ja/user-guide/setting_up_email.txt

doc/ja/user-guide/shared_repository_layouts.txt

doc/ja/user-guide/shelving_changes.txt

doc/ja/user-guide/solo_intro.txt

doc/ja/user-guide/specifying_revisions.txt

doc/ja/user-guide/stacked.txt

doc/ja/user-guide/starting_a_project.txt

doc/ja/user-guide/svn_plugin.txt

doc/ja/user-guide/undoing_mistakes.txt

doc/ja/user-guide/using_aliases.txt

doc/ja/user-guide/using_checkouts.txt

doc/ja/user-guide/using_gatekeepers.txt

doc/ja/user-guide/version_info.txt

doc/ja/user-guide/web_browsing.txt

doc/ja/user-guide/working_offline_central.txt

doc/ja/user-guide/writing_a_plugin.txt

doc/ja/user-guide/zen.txt

doc/ja/user-reference

doc/ja/user-reference/index.txt

doc/news-template.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/fixed-in.py

tools/generate_docs.py

tools/generate_release_notes.py

tools/http_client.py

tools/package_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-control.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/py2exe_boot_common.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/dirstate.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""DirState objects record the state of a directory and its bzr metadata.

Pseudo EBNF grammar for the state file. Fields are separated by NULLs, and

lines by NL. The field delimiters are omitted in the grammar, line delimiters

are not - this is done for clarity of reading. All string data is in utf8.

MINIKIND = "f" | "d" | "l" | "a" | "r" | "t";

NL = "\n";

NULL = "\0";

WHOLE_NUMBER = {digit}, digit;

BOOLEAN = "y" | "n";

REVISION_ID = a non-empty utf8 string;

dirstate format = header line, full checksum, row count, parent details,

ghost_details, entries;

header line = "#bazaar dirstate flat format 3", NL;

full checksum = "crc32: ", ["-"], WHOLE_NUMBER, NL;

row count = "num_entries: ", WHOLE_NUMBER, NL;

parent_details = WHOLE_NUMBER, {REVISION_ID}*, NL;

ghost_details = WHOLE_NUMBER, {REVISION_ID}*, NL;

entries = {entry};

entry = entry_key, current_entry_details, {parent_entry_details};

entry_key = dirname, basename, fileid;

current_entry_details = common_entry_details, working_entry_details;

parent_entry_details = common_entry_details, history_entry_details;

common_entry_details = MINIKIND, fingerprint, size, executable

working_entry_details = packed_stat

history_entry_details = REVISION_ID;

executable = BOOLEAN;

size = WHOLE_NUMBER;

fingerprint = a nonempty utf8 sequence with meaning defined by minikind.

Given this definition, the following is useful to know:

entry (aka row) - all the data for a given key.

entry[0]: The key (dirname, basename, fileid)

entry[0][0]: dirname

entry[0][1]: basename

entry[0][2]: fileid

entry[1]: The tree(s) data for this path and id combination.

entry[1][0]: The current tree

entry[1][1]: The second tree

For an entry for a tree, we have (using tree 0 - current tree) to demonstrate:

entry[1][0][0]: minikind

entry[1][0][1]: fingerprint

entry[1][0][2]: size

entry[1][0][3]: executable

entry[1][0][4]: packed_stat

OR (for non tree-0)

entry[1][1][4]: revision_id

There may be multiple rows at the root, one per id present in the root, so the

in memory root row is now:

self._dirblocks[0] -> ('', [entry ...]),

and the entries in there are

entries[0][0]: ''

entries[0][1]: ''

entries[0][2]: file_id

entries[1][0]: The tree data for the current tree for this fileid at /

etc.

Kinds:

'r' is a relocated entry: This path is not present in this tree with this id,

but the id can be found at another location. The fingerprint is used to

point to the target location.

'a' is an absent entry: In that tree the id is not present at this path.

'd' is a directory entry: This path in this tree is a directory with the

current file id. There is no fingerprint for directories.

'f' is a file entry: As for directory, but it's a file. The fingerprint is the

sha1 value of the file's canonical form, i.e. after any read filters have

been applied to the convenience form stored in the working tree.

'l' is a symlink entry: As for directory, but a symlink. The fingerprint is the

link target.

't' is a reference to a nested subtree; the fingerprint is the referenced

revision.

Ordering:

The entries on disk and in memory are ordered according to the following keys:

directory, as a list of components

filename

file-id

100

101

--- Format 1 had the following different definition: ---

102

rows = dirname, NULL, basename, NULL, MINIKIND, NULL, fileid_utf8, NULL,

103

WHOLE NUMBER (* size *), NULL, packed stat, NULL, sha1|symlink target,

104

{PARENT ROW}

105

PARENT ROW = NULL, revision_utf8, NULL, MINIKIND, NULL, dirname, NULL,

106

basename, NULL, WHOLE NUMBER (* size *), NULL, "y" | "n", NULL,

107

SHA1

108

109

PARENT ROW's are emitted for every parent that is not in the ghosts details

110

line. That is, if the parents are foo, bar, baz, and the ghosts are bar, then

111

each row will have a PARENT ROW for foo and baz, but not for bar.

112

113

114

In any tree, a kind of 'moved' indicates that the fingerprint field

115

(which we treat as opaque data specific to the 'kind' anyway) has the

116

details for the id of this row in that tree.

117

118

I'm strongly tempted to add a id->path index as well, but I think that

119

where we need id->path mapping; we also usually read the whole file, so

120

I'm going to skip that for the moment, as we have the ability to locate

121

via bisect any path in any tree, and if we lookup things by path, we can

122

accumulate an id->path mapping as we go, which will tend to match what we

123

looked for.

124

125

I plan to implement this asap, so please speak up now to alter/tweak the

126

design - and once we stabilise on this, I'll update the wiki page for

127

it.

128

129

The rationale for all this is that we want fast operations for the

130

common case (diff/status/commit/merge on all files) and extremely fast

131

operations for the less common but still frequent case (status/diff/commit

132

on specific files). Operations on specific files involve a scan for all

133

the children of a path, *in every involved tree*, which the current

134

format did not accommodate.

135

----

136

137

Design priorities:

138

1) Fast end to end use for bzr's top 5 use cases. (commit/diff/status/merge/???)

139

2) fall back current object model as needed.

140

3) scale usably to the largest trees known today - say 50K entries. (mozilla

141

is an example of this)

142

143

144

Locking:

145

Eventually reuse dirstate objects across locks IFF the dirstate file has not

146

been modified, but will require that we flush/ignore cached stat-hit data

147

because we won't want to restat all files on disk just because a lock was

148

acquired, yet we cannot trust the data after the previous lock was released.

149

150

Memory representation:

151

vector of all directories, and vector of the children ?

152

i.e.

153

root_entrie = (direntry for root, [parent_direntries_for_root]),

154

dirblocks = [

155

('', ['data for achild', 'data for bchild', 'data for cchild'])

156

('dir', ['achild', 'cchild', 'echild'])

157

]

158

- single bisect to find N subtrees from a path spec

159

- in-order for serialisation - this is 'dirblock' grouping.

160

- insertion of a file '/a' affects only the '/' child-vector, that is, to

161

insert 10K elements from scratch does not generate O(N^2) memmoves of a

162

single vector, rather each individual, which tends to be limited to a

163

manageable number. Will scale badly on trees with 10K entries in a

164

single directory. compare with Inventory.InventoryDirectory which has

165

a dictionary for the children. No bisect capability, can only probe for

166

exact matches, or grab all elements and sort.

167

- What's the risk of error here? Once we have the base format being processed

168

we should have a net win regardless of optimality. So we are going to

169

go with what seems reasonable.

170

open questions:

171

172

Maybe we should do a test profile of the core structure - 10K simulated

173

searches/lookups/etc?

174

175

Objects for each row?

176

The lifetime of Dirstate objects is current per lock, but see above for

177

possible extensions. The lifetime of a row from a dirstate is expected to be

178

very short in the optimistic case: which we are optimising for. For instance,

179

subtree status will determine from analysis of the disk data what rows need to

180

be examined at all, and will be able to determine from a single row whether

181

that file has altered or not, so we are aiming to process tens of thousands of

182

entries each second within the dirstate context, before exposing anything to

183

the larger codebase. This suggests we want the time for a single file

184

comparison to be < 0.1 milliseconds. That would give us 10000 paths per second

185

processed, and to scale to 100 thousand we'll need another order of magnitude to do

186

that. Now, as the lifetime for all unchanged entries is the time to parse, stat

187

the file on disk, and then immediately discard, the overhead of object creation

188

becomes a significant cost.

189

190

Figures: Creating a tuple from 3 elements was profiled at 0.0625

191

microseconds, whereas creating an object which is subclassed from tuple was

192

0.500 microseconds, and creating an object with 3 elements and slots was 3

193

microseconds long. 0.1 milliseconds is 100 microseconds, and ideally we'll get

194

down to 10 microseconds for the total processing - having 33% of that be object

195

creation is a huge overhead. There is a potential cost in using tuples within

196

each row which is that the conditional code to do comparisons may be slower

197

than method invocation, but method invocation is known to be slow due to stack

198

frame creation, so avoiding methods in these tight inner loops is unfortunately

199

desirable. We can consider a pyrex version of this with objects in future if

200

desired.

201

202

"""

203

204

import bisect

205

import binascii

206

import errno

207

import operator

208

import os

209

from stat import S_IEXEC

210

import stat

211

import struct

212

import sys

213

import time

214

import zlib

215

216

from bzrlib import (

217

cache_utf8,

218

debug,

219

errors,

220

inventory,

221

lock,

222

osutils,

223

static_tuple,

224

trace,

225

)

226

227

228

# These are the Windows equivalents of ENOTDIR.

229

# They are defined in pywin32.winerror, but we don't want a strong dependency

230

# for just a couple of error codes, so the numeric values are repeated here.

231

ERROR_PATH_NOT_FOUND = 3

232

ERROR_DIRECTORY = 267

233

234

235

if not getattr(struct, '_compile', None):
    # Cannot pre-compile the dirstate pack_stat
    def pack_stat(st, _encode=binascii.b2a_base64, _pack=struct.pack):
        """Convert stat values into a packed representation.

        :param st: An object exposing st_size, st_mtime, st_ctime, st_dev,
            st_ino and st_mode (e.g. the result of os.stat/os.lstat).
        :return: The base64 encoding of the six fields packed as big-endian
            unsigned 32-bit integers, without the trailing newline.

        Every field except st_mode is truncated to its low 32 bits so that
        large files (>= 4GiB), wide device/inode numbers or negative
        timestamps cannot overflow the 'L' fields and raise struct.error.
        For values that already fit in 32 bits the output is unchanged.
        """
        # base64 encoding always adds a final newline, so strip it off
        return _encode(_pack('>LLLLLL',
            st.st_size & 0xFFFFFFFF, int(st.st_mtime) & 0xFFFFFFFF,
            int(st.st_ctime) & 0xFFFFFFFF, st.st_dev & 0xFFFFFFFF,
            st.st_ino & 0xFFFFFFFF, st.st_mode))[:-1]
else:
    # compile the struct compiler we need, so as to only do it once
    from _struct import Struct
    _compiled_pack = Struct('>LLLLLL').pack
    def pack_stat(st, _encode=binascii.b2a_base64, _pack=_compiled_pack):
        """Convert stat values into a packed representation.

        :param st: An object exposing st_size, st_mtime, st_ctime, st_dev,
            st_ino and st_mode (e.g. the result of os.stat/os.lstat).
        :return: The base64 encoding of the six fields packed as big-endian
            unsigned 32-bit integers, without the trailing newline.

        Every field except st_mode is truncated to its low 32 bits so that
        large files (>= 4GiB), wide device/inode numbers or negative
        timestamps cannot overflow the 'L' fields and raise struct.error.
        For values that already fit in 32 bits the output is unchanged.
        """
        # jam 20060614 it isn't really worth removing more entries if we
        # are going to leave it in packed form.
        # With only st_mtime and st_mode filesize is 5.5M and read time is
        # 275ms; with all entries, filesize is 5.9M and read time is maybe
        # 280ms - well within the noise margin. Alternative encodings
        # ('>LL' of mtime/mode only, or '%X.%X...' hex formatting) were
        # measured and were not meaningfully faster.

        # base64 encoding always adds a final newline, so strip it off
        return _encode(_pack(
            st.st_size & 0xFFFFFFFF, int(st.st_mtime) & 0xFFFFFFFF,
            int(st.st_ctime) & 0xFFFFFFFF, st.st_dev & 0xFFFFFFFF,
            st.st_ino & 0xFFFFFFFF, st.st_mode))[:-1]

266

267

268

def _unpack_stat(packed_stat):

269

"""Turn a packed_stat back into the stat fields.

270

271

This is meant as a debugging tool, should not be used in real code.

272

"""

273

(st_size, st_mtime, st_ctime, st_dev, st_ino,

274

st_mode) = struct.unpack('>LLLLLL', binascii.a2b_base64(packed_stat))

275

return dict(st_size=st_size, st_mtime=st_mtime, st_ctime=st_ctime,

276

st_dev=st_dev, st_ino=st_ino, st_mode=st_mode)

277

278

279

class SHA1Provider(object):
    """Abstract interface for objects that can supply the sha1 of a file.

    Both methods raise NotImplementedError here; subclasses provide the
    actual implementations.
    """

    def sha1(self, abspath):
        """Compute the sha1 of the file found at an absolute path.

        :param abspath: Either a filesystem-encoded absolute path or a
            unicode path.
        """
        raise NotImplementedError(self.sha1)

    def stat_and_sha1(self, abspath):
        """Compute both the stat value and the sha1 of the file at abspath.

        :param abspath: Either a filesystem-encoded absolute path or a
            unicode path.

        Note: the stat describes the physical file, whereas the sha may be
        that of the file's canonical content.
        """
        raise NotImplementedError(self.stat_and_sha1)

300

301

302

class DefaultSHA1Provider(SHA1Provider):
    """A SHA1Provider that reads directly from the filesystem."""

    def sha1(self, abspath):
        """Return the sha1 of a file given its absolute path.

        :param abspath: Absolute path of the file, passed through unchanged
            to osutils.sha_file_by_name.
        """
        return osutils.sha_file_by_name(abspath)

    def stat_and_sha1(self, abspath):
        """Return the stat and sha1 of a file given its absolute path.

        The file is opened once; the stat is taken with os.fstat() on that
        open handle and the sha1 is computed from the same handle, so both
        values describe the same opened file.

        :param abspath: Absolute path of the file to open in binary mode.
        :return: A (statvalue, sha1) tuple.
        """
        # Use open() rather than the file() constructor: file() does not
        # exist on Python 3 and open() is the documented way to open files.
        file_obj = open(abspath, 'rb')
        try:
            statvalue = os.fstat(file_obj.fileno())
            sha1 = osutils.sha_file(file_obj)
        finally:
            # Always release the handle, even if stat or hashing fails.
            file_obj.close()
        return statvalue, sha1

318

319

320

class DirState(object):

321

"""Record directory and metadata state for fast access.

322

323

A dirstate is a specialised data structure for managing local working

324

tree state information. It's not yet well defined whether it is platform

325

specific, and if it is how we detect/parameterize that.

326

327

Dirstates use the usual lock_write, lock_read and unlock mechanisms.

328

Unlike most bzr disk formats, DirStates must be locked for reading, using

329

lock_read. (This is an os file lock internally.) This is necessary

330

because the file can be rewritten in place.

331

332

DirStates must be explicitly written with save() to commit changes; just

333

unlocking them does not write the changes to disk.

334

"""

335

336

_kind_to_minikind = {

337

'absent': 'a',

338

'file': 'f',

339

'directory': 'd',

340

'relocated': 'r',

341

'symlink': 'l',

342

'tree-reference': 't',

343

}

344

_minikind_to_kind = {

345

'a': 'absent',

346

'f': 'file',

347

'd': 'directory',

348

'l':'symlink',

349

'r': 'relocated',

350

't': 'tree-reference',

351

}

352

_stat_to_minikind = {

353

stat.S_IFDIR:'d',

354

stat.S_IFREG:'f',

355

stat.S_IFLNK:'l',

356

}

357

_to_yesno = {True:'y', False: 'n'} # TODO profile the performance gain

358

# of using int conversion rather than a dict here. AND BLAME ANDREW IF

359

# it is faster.

360

361

# TODO: jam 20070221 Figure out what to do if we have a record that exceeds

362

# the BISECT_PAGE_SIZE. For now, we just have to make it large enough

363

# that we are sure a single record will always fit.

364

BISECT_PAGE_SIZE = 4096

365

366

NOT_IN_MEMORY = 0

367

IN_MEMORY_UNMODIFIED = 1

368

IN_MEMORY_MODIFIED = 2

369

IN_MEMORY_HASH_MODIFIED = 3 # Only hash-cache updates

370

371

# A pack_stat (the x's) that is just noise and will never match the output

372

# of base64 encode.

373

NULLSTAT = 'x' * 32

374

NULL_PARENT_DETAILS = ('a', '', 0, False, '')

375

376

HEADER_FORMAT_2 = '#bazaar dirstate flat format 2\n'

377

HEADER_FORMAT_3 = '#bazaar dirstate flat format 3\n'

378

379

def __init__(self, path, sha1_provider, worth_saving_limit=0):
    """Create a DirState object.

    :param path: The path at which the dirstate file on disk should live.
    :param sha1_provider: an object meeting the SHA1Provider interface.
    :param worth_saving_limit: when the exact number of hash changed
        entries is known, only bother saving the dirstate if more than
        this count of entries have changed.
        -1 means never save hash changes, 0 means always save hash changes.
    """
    # The on-disk file, the handle onto it and the lock bookkeeping. Nothing
    # is opened or locked by the constructor.
    self._filename = path
    self._state_file = None
    self._lock_token = None
    self._lock_state = None

    # _header_state and _dirblock_state represent the current state
    # of the dirstate metadata and the per-row data respectively.
    # NOT_IN_MEMORY indicates that no data is in memory
    # IN_MEMORY_UNMODIFIED indicates that what we have in memory
    #   is the same as is on disk
    # IN_MEMORY_MODIFIED indicates that we have a modified version
    #   of what is on disk.
    # (_mark_modified may also set _dirblock_state to
    # IN_MEMORY_HASH_MODIFIED.)
    # In future we will add more granularity, for instance _dirblock_state
    # will probably support partially-in-memory as a separate variable,
    # allowing for partially-in-memory unmodified and partially-in-memory
    # modified states.
    self._header_state = DirState.NOT_IN_MEMORY
    self._dirblock_state = DirState.NOT_IN_MEMORY
    # If true, an error has been detected while updating the dirstate, and
    # for safety we're not going to commit to disk.
    self._changes_aborted = False

    # In-memory content, all empty until something is read.
    self._dirblocks = []
    self._parents = []
    self._ghosts = []
    self._end_of_header = None
    self._cutoff_time = None

    # Lookup helpers.
    self._id_index = None
    # a map from packed_stat to sha's.
    self._packed_stat_index = None
    self._split_path_cache = {}
    self._bisect_page_size = DirState.BISECT_PAGE_SIZE
    # These two attributes provide a simple cache for lookups into the
    # dirstate in-memory vectors. By probing respectively for the last
    # block, and for the next entry, we save nearly 2 bisections per path
    # during commit.
    self._last_block_index = None
    self._last_entry_index = None

    # Hashing goes through the provider, unless the 'hashcache' debug flag
    # is set, in which case the muttering wrapper is used instead.
    self._sha1_provider = sha1_provider
    if 'hashcache' not in debug.debug_flags:
        self._sha1_file = self._sha1_provider.sha1
    else:
        self._sha1_file = self._sha1_file_and_mutter

    # The set of known hash changes
    self._known_hash_changes = set()
    # How many hash changed entries can we have without saving
    self._worth_saving_limit = worth_saving_limit

434

435

def __repr__(self):

436

return "%s(%r)" % \

437

(self.__class__.__name__, self._filename)

438

439

def _mark_modified(self, hash_changed_entries=None, header_modified=False):

440

"""Mark this dirstate as modified.

441

442

:param hash_changed_entries: if non-None, mark just these entries as

443

having their hash modified.

444

:param header_modified: mark the header modified as well, not just the

445

dirblocks.

446

"""

447

#trace.mutter_callsite(3, "modified hash entries: %s", hash_changed_entries)

448

if hash_changed_entries:

449

self._known_hash_changes.update([e[0] for e in hash_changed_entries])

450

if self._dirblock_state in (DirState.NOT_IN_MEMORY,

451

DirState.IN_MEMORY_UNMODIFIED):

452

# If the dirstate is already marked a IN_MEMORY_MODIFIED, then

453

# that takes precedence.

454

self._dirblock_state = DirState.IN_MEMORY_HASH_MODIFIED

455

else:

456

# TODO: Since we now have a IN_MEMORY_HASH_MODIFIED state, we

457

# should fail noisily if someone tries to set

458

# IN_MEMORY_MODIFIED but we don't have a write-lock!

459

# We don't know exactly what changed so disable smart saving

460

self._dirblock_state = DirState.IN_MEMORY_MODIFIED

461

if header_modified:

462

self._header_state = DirState.IN_MEMORY_MODIFIED

463

464

def _mark_unmodified(self):

465

"""Mark this dirstate as unmodified."""

466

self._header_state = DirState.IN_MEMORY_UNMODIFIED

467

self._dirblock_state = DirState.IN_MEMORY_UNMODIFIED

468

self._known_hash_changes = set()

469

470

def add(self, path, file_id, kind, stat, fingerprint):
    """Add a path to be tracked.

    :param path: The path within the dirstate - '' is the root, 'foo' is the
        path foo within the root, 'foo/bar' is the path bar within foo
        within the root.
    :param file_id: The file id of the path being added.
    :param kind: The kind of the path, as a string like 'file',
        'directory', etc.
    :param stat: The output of os.lstat for the path, or None, in which
        case a size of 0 and the NULLSTAT packed stat are recorded.
    :param fingerprint: The sha value of the file's canonical form (i.e.
        after any read filters have been applied),
        or the target of a symlink,
        or the referenced revision id for tree-references,
        or '' for directories.
    :raises errors.InvalidNormalization: if the basename is not normalized
        and the normalized form cannot be accessed.
    :raises errors.InvalidEntryName: if the basename is '.' or '..'.
    :raises errors.DuplicateFileId: if file_id already has an entry whose
        tree-0 minikind is not 'a' (absent).
    :raises errors.NotVersionedError: if no block exists for the containing
        directory and the directory has no entry of its own.
    :raises errors.BzrError: if kind maps to a minikind that cannot be
        added ('absent' or 'relocated').
    """
    # adding a file:
    # find the block its in.
    # find the location in the block.
    # check its not there
    # add it.
    #------- copied from inventory.ensure_normalized_name - keep synced.
    # --- normalized_filename wants a unicode basename only, so get one.
    dirname, basename = osutils.split(path)
    # we dont import normalized_filename directly because we want to be
    # able to change the implementation at runtime for tests.
    norm_name, can_access = osutils.normalized_filename(basename)
    if norm_name != basename:
        if can_access:
            basename = norm_name
        else:
            raise errors.InvalidNormalization(path)
    # you should never have files called . or ..; just add the directory
    # in the parent, or according to the special treatment for the root
    if basename == '.' or basename == '..':
        raise errors.InvalidEntryName(path)
    # now that we've normalised, we need the correct utf8 path and
    # dirname and basename elements. This single encode and split should be
    # faster than three separate encodes.
    utf8path = (dirname + '/' + basename).strip('/').encode('utf8')
    dirname, basename = osutils.split(utf8path)
    # uses __class__ for speed; the check is needed for safety
    if file_id.__class__ is not str:
        raise AssertionError(
            "must be a utf8 file_id not %s" % (type(file_id), ))
    # Make sure the file_id does not exist in this tree
    rename_from = None
    file_id_entry = self._get_entry(0, fileid_utf8=file_id,
                                    include_deleted=True)
    if file_id_entry != (None, None):
        if file_id_entry[1][0][0] == 'a':
            if file_id_entry[0] != (dirname, basename, file_id):
                # set the old name's current operation to rename
                self.update_minimal(file_id_entry[0],
                                    'r',
                                    path_utf8='',
                                    packed_stat='',
                                    fingerprint=utf8path)
                rename_from = file_id_entry[0][0:2]
        else:
            # Describe the existing entry under separate names so that the
            # 'path' and 'kind' arguments are never clobbered.
            existing_path = osutils.pathjoin(file_id_entry[0][0],
                                             file_id_entry[0][1])
            existing_kind = DirState._minikind_to_kind[
                file_id_entry[1][0][0]]
            info = '%s:%s' % (existing_kind, existing_path)
            raise errors.DuplicateFileId(file_id, info)
    first_key = (dirname, basename, '')
    block_index, present = self._find_block_index_from_key(first_key)
    if present:
        # check the path is not in the tree
        block = self._dirblocks[block_index][1]
        entry_index, _ = self._find_entry_index(first_key, block)
        while (entry_index < len(block) and
               block[entry_index][0][0:2] == first_key[0:2]):
            if block[entry_index][1][0][0] not in 'ar':
                # this path is in the dirstate in the current tree.
                # Call form of raise: the 'raise E, msg' statement form is
                # Python-2-only syntax. The exception type is unchanged.
                raise Exception("adding already added path!")
            entry_index += 1
    else:
        # The block where we want to put the file is not present. But it
        # might be because the directory was empty, or not loaded yet. Look
        # for a parent entry, if not found, raise NotVersionedError
        parent_dir, parent_base = osutils.split(dirname)
        parent_block_idx, parent_entry_idx, _, parent_present = \
            self._get_block_entry_index(parent_dir, parent_base, 0)
        if not parent_present:
            raise errors.NotVersionedError(path, str(self))
        self._ensure_block(parent_block_idx, parent_entry_idx, dirname)
    block = self._dirblocks[block_index][1]
    entry_key = (dirname, basename, file_id)
    if stat is None:
        size = 0
        packed_stat = DirState.NULLSTAT
    else:
        size = stat.st_size
        packed_stat = pack_stat(stat)
    parent_info = self._empty_parent_info()
    minikind = DirState._kind_to_minikind[kind]
    if rename_from is not None:
        if rename_from[0]:
            old_path_utf8 = '%s/%s' % rename_from
        else:
            old_path_utf8 = rename_from[1]
        parent_info[0] = ('r', old_path_utf8, 0, False, '')
    if kind == 'file':
        entry_data = entry_key, [
            (minikind, fingerprint, size, False, packed_stat),
            ] + parent_info
    elif kind == 'directory':
        entry_data = entry_key, [
            (minikind, '', 0, False, packed_stat),
            ] + parent_info
    elif kind == 'symlink':
        entry_data = entry_key, [
            (minikind, fingerprint, size, False, packed_stat),
            ] + parent_info
    elif kind == 'tree-reference':
        entry_data = entry_key, [
            (minikind, fingerprint, 0, False, packed_stat),
            ] + parent_info
    else:
        raise errors.BzrError('unknown kind %r' % kind)
    entry_index, present = self._find_entry_index(entry_key, block)
    if not present:
        block.insert(entry_index, entry_data)
    else:
        # The key already exists: only an absent row may be overwritten,
        # and only its current-tree details are replaced.
        if block[entry_index][1][0][0] != 'a':
            raise AssertionError(" %r(%r) already added"
                                 % (basename, file_id))
        block[entry_index][1][0] = entry_data[1][0]

    if kind == 'directory':
        # insert a new dirblock
        self._ensure_block(block_index, entry_index, utf8path)
    self._mark_modified()
    if self._id_index:
        self._add_to_id_index(self._id_index, entry_key)

604

605

def _bisect(self, paths):
    """Bisect through the disk structure for specific rows.

    :param paths: A list of paths to find. NOTE(review): the list is
        sliced around positions returned by _bisect_path_left and
        _bisect_path_right, so it presumably has to be sorted in the
        order those helpers expect -- confirm against callers.
    :return: A dict mapping path => entries for found entries. Missing
        entries will not be in the map.
        The list is not sorted, and entries will be populated
        based on when they were read.
    :raises AssertionError: if the dirblocks are not NOT_IN_MEMORY.
    :raises errors.BzrError: if more than 30 reads per requested path are
        needed.
    """
    self._requires_lock()
    # We need the file pointer to be right after the initial header block
    self._read_header_if_needed()
    # If _dirblock_state was in memory, we should just return info from
    # there, this function is only meant to handle when we want to read
    # part of the disk.
    if self._dirblock_state != DirState.NOT_IN_MEMORY:
        raise AssertionError("bad dirblock state %r" % self._dirblock_state)

    # The disk representation is generally info + '\0\n\0' at the end. But
    # for bisecting, it is easier to treat this as '\0' + info + '\0\n'
    # Because it means we can sync on the '\n'
    state_file = self._state_file
    file_size = os.fstat(state_file.fileno()).st_size
    # We end up with 2 extra fields, we should have a trailing '\n' to
    # ensure that we read the whole record, and we should have a precursor
    # '' which ensures that we start after the previous '\n'
    entry_field_count = self._fields_per_entry() + 1

    low = self._end_of_header
    high = file_size - 1  # Ignore the final '\0'
    # Map from path => [entry, ...]
    found = {}

    # Avoid infinite seeking
    max_count = 30 * len(paths)
    count = 0
    # pending is a list of places to look.
    # each entry is a tuple of low, high, paths
    #   low -> the first byte offset to read (inclusive)
    #   high -> the last byte offset (inclusive)
    #   paths -> The list of paths that should be found in
    #            the [low, high] range
    pending = [(low, high, paths)]

    page_size = self._bisect_page_size

    fields_to_entry = self._get_fields_to_entry()

    while pending:
        low, high, cur_files = pending.pop()

        if not cur_files or low >= high:
            # Nothing to find
            continue

        count += 1
        if count > max_count:
            raise errors.BzrError('Too many seeks, most likely a bug.')

        # Floor division: the result is a byte offset handed to seek(), so
        # it must stay an integer even where '/' means true division.
        mid = max(low, (low + high - page_size) // 2)

        state_file.seek(mid)
        # limit the read size, so we don't end up reading data that we have
        # already read.
        read_size = min(page_size, (high - mid) + 1)
        block = state_file.read(read_size)

        start = mid
        entries = block.split('\n')

        if len(entries) < 2:
            # We didn't find a '\n', so we cannot have found any records.
            # So put this range back and try again. But we know we have to
            # increase the page size, because a single read did not contain
            # a record break (so records must be larger than page_size)
            page_size *= 2
            pending.append((low, high, cur_files))
            continue

        # Check the first and last entries, in case they are partial, or if
        # we don't care about the rest of this page
        first_entry_num = 0
        first_fields = entries[0].split('\0')
        if len(first_fields) < entry_field_count:
            # We didn't get the complete first entry
            # so move start, and grab the next, which
            # should be a full entry
            start += len(entries[0]) + 1
            first_fields = entries[1].split('\0')
            first_entry_num = 1

        if len(first_fields) <= 2:
            # We didn't even get a filename here... what do we do?
            # Try a large page size and repeat this query
            page_size *= 2
            pending.append((low, high, cur_files))
            continue

        # Find what entries we are looking for, which occur before and
        # after this first record.
        after = start
        if first_fields[1]:
            first_path = first_fields[1] + '/' + first_fields[2]
        else:
            first_path = first_fields[2]
        first_loc = _bisect_path_left(cur_files, first_path)

        # These exist before the current location
        pre = cur_files[:first_loc]
        # These occur after the current location, which may be in the
        # data we read, or might be after the last entry
        post = cur_files[first_loc:]

        if post and len(first_fields) >= entry_field_count:
            # We have files after the first entry

            # Parse the last entry
            last_entry_num = len(entries) - 1
            last_fields = entries[last_entry_num].split('\0')
            if len(last_fields) < entry_field_count:
                # The very last hunk was not complete,
                # read the previous hunk
                after = mid + len(block) - len(entries[-1])
                last_entry_num -= 1
                last_fields = entries[last_entry_num].split('\0')
            else:
                after = mid + len(block)

            if last_fields[1]:
                last_path = last_fields[1] + '/' + last_fields[2]
            else:
                last_path = last_fields[2]
            last_loc = _bisect_path_right(post, last_path)

            middle_files = post[:last_loc]
            post = post[last_loc:]

            if middle_files:
                # We have files that should occur in this block
                # (>= first, <= last)
                # Either we will find them here, or we can mark them as
                # missing.

                if middle_files[0] == first_path:
                    # We might need to go before this location
                    pre.append(first_path)
                if middle_files[-1] == last_path:
                    post.insert(0, last_path)

                # Find out what paths we have. Kept under its own name so
                # that the 'paths' argument is not shadowed.
                rows_by_path = {first_path: [first_fields]}
                # last_path might == first_path so we need to be
                # careful if we should append rather than overwrite
                if last_entry_num != first_entry_num:
                    rows_by_path.setdefault(last_path, []).append(
                        last_fields)
                for num in xrange(first_entry_num + 1, last_entry_num):
                    # TODO: jam 20070223 We are already splitting here, so
                    #       shouldn't we just split the whole thing rather
                    #       than doing the split again in add_one_record?
                    fields = entries[num].split('\0')
                    if fields[1]:
                        path = fields[1] + '/' + fields[2]
                    else:
                        path = fields[2]
                    rows_by_path.setdefault(path, []).append(fields)

                for path in middle_files:
                    for fields in rows_by_path.get(path, []):
                        # offset by 1 because of the opening '\0'
                        # consider changing fields_to_entry to avoid the
                        # extra list slice
                        entry = fields_to_entry(fields[1:])
                        found.setdefault(path, []).append(entry)

        # Now we have split up everything into pre, middle, and post, and
        # we have handled everything that fell in 'middle'.
        # We add 'post' first, so that we prefer to seek towards the
        # beginning, so that we will tend to go as early as we need, and
        # then only seek forward after that.
        if post:
            pending.append((after, high, post))
        if pre:
            pending.append((low, start - 1, pre))

    # Consider that we may want to return the directory entries in sorted
    # order. For now, we just return them in whatever order we found them,
    # and leave it up to the caller if they care if it is ordered or not.
    return found

793

794

def _bisect_dirblocks(self, dir_list):
    """Bisect through the disk structure to find entries in given dirs.

    _bisect_dirblocks is meant to find the contents of directories, which
    differs from _bisect, which only finds individual entries.

    :param dir_list: A sorted list of directory names ['', 'dir', 'foo'].
    :return: A map from dir => entries_for_dir
    :raises AssertionError: if the dirblocks are not NOT_IN_MEMORY.
    :raises errors.BzrError: if more than 30 reads per requested directory
        are needed.
    """
    # TODO: jam 20070223 A lot of the bisecting logic could be shared
    #       between this and _bisect. It would require parameterizing the
    #       inner loop with a function, though. We should evaluate the
    #       performance difference.
    self._requires_lock()
    # We need the file pointer to be right after the initial header block
    self._read_header_if_needed()
    # If _dirblock_state was in memory, we should just return info from
    # there, this function is only meant to handle when we want to read
    # part of the disk.
    if self._dirblock_state != DirState.NOT_IN_MEMORY:
        raise AssertionError("bad dirblock state %r" % self._dirblock_state)
    # The disk representation is generally info + '\0\n\0' at the end. But
    # for bisecting, it is easier to treat this as '\0' + info + '\0\n'
    # Because it means we can sync on the '\n'
    state_file = self._state_file
    file_size = os.fstat(state_file.fileno()).st_size
    # We end up with 2 extra fields, we should have a trailing '\n' to
    # ensure that we read the whole record, and we should have a precursor
    # '' which ensures that we start after the previous '\n'
    entry_field_count = self._fields_per_entry() + 1

    low = self._end_of_header
    high = file_size - 1  # Ignore the final '\0'
    # Map from dir => [entry, ...]
    found = {}

    # Avoid infinite seeking
    max_count = 30 * len(dir_list)
    count = 0
    # pending is a list of places to look.
    # each entry is a tuple of low, high, dirs
    #   low -> the first byte offset to read (inclusive)
    #   high -> the last byte offset (inclusive)
    #   dirs -> The list of directories that should be found in
    #           the [low, high] range
    pending = [(low, high, dir_list)]

    page_size = self._bisect_page_size

    fields_to_entry = self._get_fields_to_entry()

    while pending:
        low, high, cur_dirs = pending.pop()

        if not cur_dirs or low >= high:
            # Nothing to find
            continue

        count += 1
        if count > max_count:
            raise errors.BzrError('Too many seeks, most likely a bug.')

        # Floor division: the result is a byte offset handed to seek(), so
        # it must stay an integer even where '/' means true division.
        mid = max(low, (low + high - page_size) // 2)

        state_file.seek(mid)
        # limit the read size, so we don't end up reading data that we have
        # already read.
        read_size = min(page_size, (high - mid) + 1)
        block = state_file.read(read_size)

        start = mid
        entries = block.split('\n')

        if len(entries) < 2:
            # We didn't find a '\n', so we cannot have found any records.
            # So put this range back and try again. But we know we have to
            # increase the page size, because a single read did not contain
            # a record break (so records must be larger than page_size)
            page_size *= 2
            pending.append((low, high, cur_dirs))
            continue

        # Check the first and last entries, in case they are partial, or if
        # we don't care about the rest of this page
        first_entry_num = 0
        first_fields = entries[0].split('\0')
        if len(first_fields) < entry_field_count:
            # We didn't get the complete first entry
            # so move start, and grab the next, which
            # should be a full entry
            start += len(entries[0]) + 1
            first_fields = entries[1].split('\0')
            first_entry_num = 1

        if len(first_fields) <= 1:
            # We didn't even get a dirname here... what do we do?
            # Try a large page size and repeat this query
            page_size *= 2
            pending.append((low, high, cur_dirs))
            continue

        # Find what entries we are looking for, which occur before and
        # after this first record.
        after = start
        first_dir = first_fields[1]
        first_loc = bisect.bisect_left(cur_dirs, first_dir)

        # These exist before the current location
        pre = cur_dirs[:first_loc]
        # These occur after the current location, which may be in the
        # data we read, or might be after the last entry
        post = cur_dirs[first_loc:]

        if post and len(first_fields) >= entry_field_count:
            # We have records to look at after the first entry

            # Parse the last entry
            last_entry_num = len(entries) - 1
            last_fields = entries[last_entry_num].split('\0')
            if len(last_fields) < entry_field_count:
                # The very last hunk was not complete,
                # read the previous hunk
                after = mid + len(block) - len(entries[-1])
                last_entry_num -= 1
                last_fields = entries[last_entry_num].split('\0')
            else:
                after = mid + len(block)

            last_dir = last_fields[1]
            last_loc = bisect.bisect_right(post, last_dir)

            middle_dirs = post[:last_loc]
            post = post[last_loc:]

            if middle_dirs:
                # We have directories that should occur in this block
                # (>= first, <= last)
                # Either we will find them here, or we can mark them as
                # missing.

                if middle_dirs[0] == first_dir:
                    # We might need to go before this location
                    pre.append(first_dir)
                if middle_dirs[-1] == last_dir:
                    post.insert(0, last_dir)

                # Find out what directories we have rows for
                rows_by_dir = {first_dir: [first_fields]}
                # last_dir might == first_dir so we need to be
                # careful if we should append rather than overwrite
                if last_entry_num != first_entry_num:
                    rows_by_dir.setdefault(last_dir, []).append(last_fields)
                for num in xrange(first_entry_num + 1, last_entry_num):
                    # TODO: jam 20070223 We are already splitting here, so
                    #       shouldn't we just split the whole thing rather
                    #       than doing the split again in add_one_record?
                    fields = entries[num].split('\0')
                    rows_by_dir.setdefault(fields[1], []).append(fields)

                for cur_dir in middle_dirs:
                    for fields in rows_by_dir.get(cur_dir, []):
                        # offset by 1 because of the opening '\0'
                        # consider changing fields_to_entry to avoid the
                        # extra list slice
                        entry = fields_to_entry(fields[1:])
                        found.setdefault(cur_dir, []).append(entry)

        # Now we have split up everything into pre, middle, and post, and
        # we have handled everything that fell in 'middle'.
        # We add 'post' first, so that we prefer to seek towards the
        # beginning, so that we will tend to go as early as we need, and
        # then only seek forward after that.
        if post:
            pending.append((after, high, post))
        if pre:
            pending.append((low, start - 1, pre))

    return found

972

973

def _bisect_recursive(self, paths):
    """Bisect for entries for all paths and their children.

    This will use bisect to find all records for the supplied paths. It
    will then continue to bisect for any records which are marked as
    directories, and for the targets of records marked as renames.

    :param paths: The paths to start from; handed unchanged to _bisect.
        NOTE(review): earlier documentation described this as a sorted list
        of (dir, name) pairs, but _bisect treats its argument as a list of
        path strings -- confirm against callers.
    :return: A dictionary mapping (dir, name, file_id) => [tree_info]
    """
    # Map from (dir, name, file_id) => [tree_info]
    result = {}
    # Every (dir, name) pair that has been recorded in result
    seen_dir_names = set()
    # Directories whose blocks have already been requested
    dirs_done = set()

    # Get the ball rolling with the first bisect for all entries.
    batch = self._bisect(paths)
    while batch:
        # Directories that need to be read
        dirs_todo = set()
        # Rename targets that need to be looked up directly
        targets_todo = set()
        for entry_list in batch.itervalues():
            for key, trees_info in entry_list:
                result[key] = trees_info
                seen_dir_names.add(key[:2])
                queued_as_dir = False
                for tree_info in trees_info:
                    minikind = tree_info[0]
                    if minikind == 'd':
                        if queued_as_dir:
                            # We already processed this one as a directory,
                            # we don't need to do the extra work again.
                            continue
                        subdir, name, file_id = key
                        dir_path = osutils.pathjoin(subdir, name)
                        queued_as_dir = True
                        if dir_path not in dirs_done:
                            dirs_todo.add(dir_path)
                    elif minikind == 'r':
                        # Rename, we need to directly search the target
                        # which is contained in the fingerprint column
                        target = tree_info[1]
                        target_dir_name = osutils.split(target)
                        if target_dir_name[0] in dirs_todo:
                            # This entry will be found in the dir search
                            continue
                        if target_dir_name not in seen_dir_names:
                            targets_todo.add(target)
        # Now we have a list of paths to look for directly, and
        # directory blocks that need to be read.
        # The next batch mixes keys that are paths with keys that are
        # directories, but that is okay, because we only really care about
        # the values.
        batch = self._bisect(sorted(targets_todo))
        batch.update(self._bisect_dirblocks(sorted(dirs_todo)))
        dirs_done.update(dirs_todo)
    return result

1033

1034

def _discard_merge_parents(self):
    """Discard any parents trees beyond the first.

    Note that if this fails the dirstate is corrupted.

    After this function returns the dirstate contains 2 trees, neither of
    which are ghosted.

    Nothing is changed when there are no parents at all.
    """
    self._read_header_if_needed()
    parent_ids = self.get_parent_ids()
    if len(parent_ids) < 1:
        return
    # only require all dirblocks if we are doing a full-pass removal.
    self._read_dirblocks_if_needed()
    # (current tree minikind, first parent minikind) pairs of rows that
    # carry no information once the other parents are gone.
    dead_patterns = set([('a', 'r'), ('a', 'a'), ('r', 'r'), ('r', 'a')])

    def iter_entries_removable():
        """Yield every entry, then drop the rows the caller left dead."""
        for dirblock in self._dirblocks:
            rows = dirblock[1]
            dead_indexes = []
            for index, entry in enumerate(rows):
                yield entry
                # Deliberately inspected *after* the yield: by now the
                # caller has rewritten the entry's parent details.
                minikinds = (entry[1][0][0], entry[1][1][0])
                if minikinds in dead_patterns:
                    dead_indexes.append(index)
            if not dead_indexes:
                continue
            if len(dead_indexes) == len(rows):
                del rows[:]
            else:
                # Delete from the back so earlier indexes stay valid.
                for index in reversed(dead_indexes):
                    del rows[index]

    if parent_ids[0] in self.get_ghosts():
        # if the first parent is a ghost: every row gets exactly one,
        # empty, parent column.
        empty_parent = [DirState.NULL_PARENT_DETAILS]
        for entry in iter_entries_removable():
            entry[1][1:] = empty_parent
    else:
        # Keep the current tree and the first parent, drop the rest.
        for entry in iter_entries_removable():
            del entry[1][2:]

    self._ghosts = []
    self._parents = [parent_ids[0]]
    self._mark_modified(header_modified=True)

1074

1075

def _empty_parent_info(self):

1076

return [DirState.NULL_PARENT_DETAILS] * (len(self._parents) -

1077

len(self._ghosts))

1078

1079

def _ensure_block(self, parent_block_index, parent_row_index, dirname):

1080

"""Ensure a block for dirname exists.

1081

1082

This function exists to let callers which know that there is a

1083

directory dirname ensure that the block for it exists. This block can

1084

fail to exist because of demand loading, or because a directory had no

1085

children. In either case it is not an error. It is however an error to

1086

call this if there is no parent entry for the directory, and thus the

1087

function requires the coordinates of such an entry to be provided.

1088

1089

The root row is special cased and can be indicated with a parent block

1090

and row index of -1

1091

1092

:param parent_block_index: The index of the block in which dirname's row

1093

exists.

1094

:param parent_row_index: The index in the parent block where the row

1095

exists.

1096

:param dirname: The utf8 dirname to ensure there is a block for.

1097

:return: The index for the block.

1098

"""

1099

if dirname == '' and parent_row_index == 0 and parent_block_index == 0:

1100

# This is the signature of the root row, and the

1101

# contents-of-root row is always index 1

1102

return 1

1103

# the basename of the directory must be the end of its full name.

1104

if not (parent_block_index == -1 and

1105

parent_block_index == -1 and dirname == ''):

1106

if not dirname.endswith(

1107

self._dirblocks[parent_block_index][1][parent_row_index][0][1]):

1108

raise AssertionError("bad dirname %r" % dirname)

1109

block_index, present = self._find_block_index_from_key((dirname, '', ''))

1110

if not present:

1111

## In future, when doing partial parsing, this should load and

1112

# populate the entire block.

1113

self._dirblocks.insert(block_index, (dirname, []))

1114

return block_index

1115

1116

def _entries_to_current_state(self, new_entries):

1117

"""Load new_entries into self.dirblocks.

1118

1119

Process new_entries into the current state object, making them the active

1120

state. The entries are grouped together by directory to form dirblocks.

1121

1122

:param new_entries: A sorted list of entries. This function does not sort

1123

to prevent unneeded overhead when callers have a sorted list already.

1124

:return: Nothing.

1125

"""

1126

if new_entries[0][0][0:2] != ('', ''):

1127

raise AssertionError(

1128

"Missing root row %r" % (new_entries[0][0],))

1129

# The two blocks here are deliberate: the root block and the

1130

# contents-of-root block.

1131

self._dirblocks = [('', []), ('', [])]

1132

current_block = self._dirblocks[0][1]

1133

current_dirname = ''

1134

root_key = ('', '')

1135

append_entry = current_block.append

1136

for entry in new_entries:

1137

if entry[0][0] != current_dirname:

1138

# new block - different dirname

1139

current_block = []

1140

current_dirname = entry[0][0]

1141

self._dirblocks.append((current_dirname, current_block))

1142

append_entry = current_block.append

1143

# append the entry to the current block

1144

append_entry(entry)

1145

self._split_root_dirblock_into_contents()

1146

1147

def _split_root_dirblock_into_contents(self):

1148

"""Split the root dirblocks into root and contents-of-root.

1149

1150

After parsing by path, we end up with root entries and contents-of-root

1151

entries in the same block. This loop splits them out again.

1152

"""

1153

# The above loop leaves the "root block" entries mixed with the

1154

# "contents-of-root block". But we don't want an if check on

1155

# all entries, so instead we just fix it up here.

1156

if self._dirblocks[1] != ('', []):

1157

raise ValueError("bad dirblock start %r" % (self._dirblocks[1],))

1158

root_block = []

1159

contents_of_root_block = []

1160

for entry in self._dirblocks[0][1]:

1161

if not entry[0][1]: # This is a root entry

1162

root_block.append(entry)

1163

else:

1164

contents_of_root_block.append(entry)

1165

self._dirblocks[0] = ('', root_block)

1166

self._dirblocks[1] = ('', contents_of_root_block)

1167

1168

def _entries_for_path(self, path):

1169

"""Return a list with all the entries that match path for all ids."""

1170

dirname, basename = os.path.split(path)

1171

key = (dirname, basename, '')

1172

block_index, present = self._find_block_index_from_key(key)

1173

if not present:

1174

# the block which should contain path is absent.

1175

return []

1176

result = []

1177

block = self._dirblocks[block_index][1]

1178

entry_index, _ = self._find_entry_index(key, block)

1179

# we may need to look at multiple entries at this path: walk while the specific_files match.

1180

while (entry_index < len(block) and

1181

block[entry_index][0][0:2] == key[0:2]):

1182

result.append(block[entry_index])

1183

entry_index += 1

1184

return result

1185

1186

def _entry_to_line(self, entry):
    """Serialize entry to a NULL delimited line ready for _get_output_lines.

    :param entry: An entry_tuple as defined in the module docstring.
    :return: The key fields followed by the fields of every tree, joined
        with '\\0'. Size is written with str() and the executable flag is
        translated through DirState._to_yesno.
    """
    fields = list(entry[0])
    for tree_number, details in enumerate(entry[1]):
        # details is (minikind, fingerprint, size, executable,
        # tree_specific_string); the key occupies the first 3 slots and
        # every tree adds 5 more.
        base = 3 + 5 * tree_number
        fields.extend(details)
        # size
        fields[base + 2] = str(details[2])
        # executable
        fields[base + 3] = DirState._to_yesno[details[3]]
    return '\0'.join(fields)

1204

1205

def _fields_per_entry(self):

1206

"""How many null separated fields should be in each entry row.

1207

1208

Each line now has an extra '\n' field which is not used

1209

so we just skip over it

1210

entry size:

1211

3 fields for the key

1212

+ number of fields per tree_data (5) * tree count

1213

+ newline

1214

"""

1215

tree_count = 1 + self._num_present_parents()

1216

return 3 + 5 * tree_count + 1

1217

1218

def _find_block(self, key, add_if_missing=False):

1219

"""Return the block that key should be present in.

1220

1221

:param key: A dirstate entry key.

1222

:return: The block tuple.

1223

"""

1224

block_index, present = self._find_block_index_from_key(key)

1225

if not present:

1226

if not add_if_missing:

1227

# check to see if key is versioned itself - we might want to

1228

# add it anyway, because dirs with no entries dont get a

1229

# dirblock at parse time.

1230

# This is an uncommon branch to take: most dirs have children,

1231

# and most code works with versioned paths.

1232

parent_base, parent_name = osutils.split(key[0])

1233

if not self._get_block_entry_index(parent_base, parent_name, 0)[3]:

1234

# some parent path has not been added - its an error to add

1235

# this child

1236

raise errors.NotVersionedError(key[0:2], str(self))

1237

self._dirblocks.insert(block_index, (key[0], []))

1238

return self._dirblocks[block_index]

1239

1240

def _find_block_index_from_key(self, key):

1241

"""Find the dirblock index for a key.

1242

1243

:return: The block index, True if the block for the key is present.

1244

"""

1245

if key[0:2] == ('', ''):

1246

return 0, True

1247

try:

1248

if (self._last_block_index is not None and

1249

self._dirblocks[self._last_block_index][0] == key[0]):

1250

return self._last_block_index, True

1251

except IndexError:

1252

pass

1253

block_index = bisect_dirblock(self._dirblocks, key[0], 1,

1254

cache=self._split_path_cache)

1255

# _right returns one-past-where-key is so we have to subtract

1256

# one to use it. we use _right here because there are two

1257

# '' blocks - the root, and the contents of root

1258

# we always have a minimum of 2 in self._dirblocks: root and

1259

# root-contents, and for '', we get 2 back, so this is

1260

# simple and correct:

1261

present = (block_index < len(self._dirblocks) and

1262

self._dirblocks[block_index][0] == key[0])

1263

self._last_block_index = block_index

1264

# Reset the entry index cache to the beginning of the block.

1265

self._last_entry_index = -1

1266

return block_index, present

1267

1268

def _find_entry_index(self, key, block):

1269

"""Find the entry index for a key in a block.

1270

1271

:return: The entry index, True if the entry for the key is present.

1272

"""

1273

len_block = len(block)

1274

try:

1275

if self._last_entry_index is not None:

1276

# mini-bisect here.

1277

entry_index = self._last_entry_index + 1

1278

# A hit is when the key is after the last slot, and before or

1279

# equal to the next slot.

1280

if ((entry_index > 0 and block[entry_index - 1][0] < key) and

1281

key <= block[entry_index][0]):

1282

self._last_entry_index = entry_index

1283

present = (block[entry_index][0] == key)

1284

return entry_index, present

1285

except IndexError:

1286

pass

1287

entry_index = bisect.bisect_left(block, (key, []))

1288

present = (entry_index < len_block and

1289

block[entry_index][0] == key)

1290

self._last_entry_index = entry_index

1291

return entry_index, present

1292

1293

@staticmethod
def from_tree(tree, dir_state_filename, sha1_provider=None):
    """Create a dirstate from a bzr Tree.

    :param tree: The tree which should provide parent information and
        inventory ids.
    :param dir_state_filename: Passed to DirState.initialize to create the
        new dirstate.
    :param sha1_provider: an object meeting the SHA1Provider interface.
        If None, a DefaultSHA1Provider is used.
    :return: a DirState object which is currently locked for writing.
        (it was locked by DirState.initialize)
    """
    result = DirState.initialize(dir_state_filename,
                                 sha1_provider=sha1_provider)
    try:
        tree.lock_read()
        # Bound before the inner try so that the finally clause can always
        # iterate it, even when get_parent_ids() itself fails.
        parent_trees = []
        try:
            for parent_id in tree.get_parent_ids():
                parent_tree = tree.branch.repository.revision_tree(parent_id)
                # Lock before recording, so that only trees which really
                # are locked get unlocked during cleanup.
                parent_tree.lock_read()
                parent_trees.append((parent_id, parent_tree))
            result.set_parent_trees(parent_trees, [])
            result.set_state_from_inventory(tree.inventory)
        finally:
            for revid, parent_tree in parent_trees:
                parent_tree.unlock()
            tree.unlock()
    except:
        # The caller won't have a chance to unlock this, so make sure we
        # cleanup ourselves
        result.unlock()
        raise
    return result

1328

1329

def update_by_delta(self, delta):

1330

"""Apply an inventory delta to the dirstate for tree 0

1331

1332

This is the workhorse for apply_inventory_delta in dirstate based

1333

trees.

1334

1335

:param delta: An inventory delta. See Inventory.apply_delta for

1336

details.

1337

"""

1338

self._read_dirblocks_if_needed()

1339

encode = cache_utf8.encode

1340

insertions = {}

1341

removals = {}

1342

# Accumulate parent references (path_utf8, id), to check for parentless

1343

# items or items placed under files/links/tree-references. We get

1344

# references from every item in the delta that is not a deletion and

1345

# is not itself the root.

1346

parents = set()

1347

# Added ids must not be in the dirstate already. This set holds those

1348

# ids.

1349

new_ids = set()

1350

# This loop transforms the delta to single atomic operations that can

1351

# be executed and validated.

1352

for old_path, new_path, file_id, inv_entry in sorted(

1353

inventory._check_delta_unique_old_paths(

1354

inventory._check_delta_unique_new_paths(

1355

inventory._check_delta_ids_match_entry(

1356

inventory._check_delta_ids_are_valid(

1357

inventory._check_delta_new_path_entry_both_or_None(delta))))),

1358

reverse=True):

1359

if (file_id in insertions) or (file_id in removals):

1360

raise errors.InconsistentDelta(old_path or new_path, file_id,

1361

"repeated file_id")

1362

if old_path is not None:

1363

old_path = old_path.encode('utf-8')

1364

removals[file_id] = old_path

1365

else:

1366

new_ids.add(file_id)

1367

if new_path is not None:

1368

if inv_entry is None:

1369

raise errors.InconsistentDelta(new_path, file_id,

1370

"new_path with no entry")

1371

new_path = new_path.encode('utf-8')

1372

dirname_utf8, basename = osutils.split(new_path)

1373

if basename:

1374

parents.add((dirname_utf8, inv_entry.parent_id))

1375

key = (dirname_utf8, basename, file_id)

1376

minikind = DirState._kind_to_minikind[inv_entry.kind]

1377

if minikind == 't':

1378

fingerprint = inv_entry.reference_revision or ''

1379

else:

1380

fingerprint = ''

1381

insertions[file_id] = (key, minikind, inv_entry.executable,

1382

fingerprint, new_path)

1383

# Transform moves into delete+add pairs

1384

if None not in (old_path, new_path):

1385

for child in self._iter_child_entries(0, old_path):

1386

if child[0][2] in insertions or child[0][2] in removals:

1387

continue

1388

child_dirname = child[0][0]

1389

child_basename = child[0][1]

1390

minikind = child[1][0][0]

1391

fingerprint = child[1][0][4]

1392

executable = child[1][0][3]

1393

old_child_path = osutils.pathjoin(child_dirname,

1394

child_basename)

1395

removals[child[0][2]] = old_child_path

1396

child_suffix = child_dirname[len(old_path):]

1397

new_child_dirname = (new_path + child_suffix)

1398

key = (new_child_dirname, child_basename, child[0][2])

1399

new_child_path = osutils.pathjoin(new_child_dirname,

1400

child_basename)

1401

insertions[child[0][2]] = (key, minikind, executable,

1402

fingerprint, new_child_path)

1403

self._check_delta_ids_absent(new_ids, delta, 0)

1404

try:

1405

self._apply_removals(removals.iteritems())

1406

self._apply_insertions(insertions.values())

1407

# Validate parents

1408

self._after_delta_check_parents(parents, 0)

1409

except errors.BzrError, e:

1410

self._changes_aborted = True

1411

if 'integrity error' not in str(e):

1412

raise

1413

# _get_entry raises BzrError when a request is inconsistent; we

1414

# want such errors to be shown as InconsistentDelta - and that

1415

# fits the behaviour we trigger.

1416

raise errors.InconsistentDeltaDelta(delta, "error from _get_entry.")

1417

1418

def _apply_removals(self, removals):
    """Make the tree 0 entry of every removed path absent.

    Removals are processed in reverse path order. After each one, any
    dirblock still present for the removed path is scanned; a child that
    is not absent or relocated in tree 0 means the delta is malformed.

    :param removals: An iterable of (file_id, path_utf8) pairs.
    :raises errors.InconsistentDelta: when the path is not present, holds
        a different file id, or leaves live children behind.
        self._changes_aborted is set before raising.
    """
    by_path_descending = sorted(removals, reverse=True,
                                key=lambda item: item[1])
    for file_id, path in by_path_descending:
        dirname, basename = osutils.split(path)
        block_i, entry_i, d_present, f_present = \
            self._get_block_entry_index(dirname, basename, 0)
        try:
            entry = self._dirblocks[block_i][1][entry_i]
        except IndexError:
            self._changes_aborted = True
            raise errors.InconsistentDelta(path, file_id,
                "Wrong path for old path.")
        if not f_present or entry[1][0][0] in 'ar':
            self._changes_aborted = True
            raise errors.InconsistentDelta(path, file_id,
                "Wrong path for old path.")
        found_id = entry[0][2]
        if file_id != found_id:
            self._changes_aborted = True
            raise errors.InconsistentDelta(path, file_id,
                "Attempt to remove path has wrong id - found %r."
                % found_id)
        self._make_absent(entry)
        # See if we have a malformed delta: deleting a directory must not
        # leave crud behind. This increases the number of bisects needed
        # substantially, but deletion or renames of large numbers of paths
        # is rare enough it shouldn't be an issue (famous last words?) RBC
        # 20080730.
        block_i, entry_i, d_present, f_present = \
            self._get_block_entry_index(path, '', 0)
        if not d_present:
            continue
        # The dir block is still present in the dirstate; this could
        # be due to it being in a parent tree, or a corrupt delta.
        for child_entry in self._dirblocks[block_i][1]:
            if child_entry[1][0][0] not in ('r', 'a'):
                self._changes_aborted = True
                raise errors.InconsistentDelta(path, entry[0][2],
                    "The file id was deleted but its children were "
                    "not deleted.")

1456

1457

def _apply_insertions(self, adds):

1458

try:

1459

for key, minikind, executable, fingerprint, path_utf8 in sorted(adds):

1460

self.update_minimal(key, minikind, executable, fingerprint,

1461

path_utf8=path_utf8)

1462

except errors.NotVersionedError:

1463

self._changes_aborted = True

1464

raise errors.InconsistentDelta(path_utf8.decode('utf8'), key[2],

1465

"Missing parent")

1466

1467

def update_basis_by_delta(self, delta, new_revid):

1468

"""Update the parents of this tree after a commit.

1469

1470

This gives the tree one parent, with revision id new_revid. The

1471

inventory delta is applied to the current basis tree to generate the

1472

inventory for the parent new_revid, and all other parent trees are

1473

discarded.

1474

1475

Note that an exception during the operation of this method will leave

1476

the dirstate in a corrupt state where it should not be saved.

1477

1478

Finally, we expect all changes to be synchronising the basis tree with

1479

the working tree.

1480

1481

:param new_revid: The new revision id for the trees parent.

1482

:param delta: An inventory delta (see apply_inventory_delta) describing

1483

the changes from the current left most parent revision to new_revid.

1484

"""

1485

self._read_dirblocks_if_needed()

1486

self._discard_merge_parents()

1487

if self._ghosts != []:

1488

raise NotImplementedError(self.update_basis_by_delta)

1489

if len(self._parents) == 0:

1490

# setup a blank tree, the most simple way.

1491

empty_parent = DirState.NULL_PARENT_DETAILS

1492

for entry in self._iter_entries():

1493

entry[1].append(empty_parent)

1494

self._parents.append(new_revid)

1495

1496

self._parents[0] = new_revid

1497

1498

delta = sorted(delta, reverse=True)

1499

adds = []

1500

changes = []

1501

deletes = []

1502

# The paths this function accepts are unicode and must be encoded as we

1503

# go.

1504

encode = cache_utf8.encode

1505

inv_to_entry = self._inv_entry_to_details

1506

# delta is now (deletes, changes), (adds) in reverse lexographical

1507

# order.

1508

# deletes in reverse lexographic order are safe to process in situ.

1509

# renames are not, as a rename from any path could go to a path

1510

# lexographically lower, so we transform renames into delete, add pairs,

1511

# expanding them recursively as needed.

1512

# At the same time, to reduce interface friction we convert the input

1513

# inventory entries to dirstate.

1514

root_only = ('', '')

1515

# Accumulate parent references (path_utf8, id), to check for parentless

1516

# items or items placed under files/links/tree-references. We get

1517

# references from every item in the delta that is not a deletion and

1518

# is not itself the root.

1519

parents = set()

1520

# Added ids must not be in the dirstate already. This set holds those

1521

# ids.

1522

new_ids = set()

1523

for old_path, new_path, file_id, inv_entry in delta:

1524

if inv_entry is not None and file_id != inv_entry.file_id:

1525

raise errors.InconsistentDelta(new_path, file_id,

1526

"mismatched entry file_id %r" % inv_entry)

1527

if new_path is not None:

1528

if inv_entry is None:

1529

raise errors.InconsistentDelta(new_path, file_id,

1530

"new_path with no entry")

1531

new_path_utf8 = encode(new_path)

1532

# note the parent for validation

1533

dirname_utf8, basename_utf8 = osutils.split(new_path_utf8)

1534

if basename_utf8:

1535

parents.add((dirname_utf8, inv_entry.parent_id))

1536

if old_path is None:

1537

adds.append((None, encode(new_path), file_id,

1538

inv_to_entry(inv_entry), True))

1539

new_ids.add(file_id)

1540

elif new_path is None:

1541

deletes.append((encode(old_path), None, file_id, None, True))

1542

elif (old_path, new_path) != root_only:

1543

# Renames:

1544

# Because renames must preserve their children we must have

1545

# processed all relocations and removes before hand. The sort

1546

# order ensures we've examined the child paths, but we also

1547

# have to execute the removals, or the split to an add/delete

1548

# pair will result in the deleted item being reinserted, or

1549

# renamed items being reinserted twice - and possibly at the

1550

# wrong place. Splitting into a delete/add pair also simplifies

1551

# the handling of entries with ('f', ...), ('r' ...) because

1552

# the target of the 'r' is old_path here, and we add that to

1553

# deletes, meaning that the add handler does not need to check

1554

# for 'r' items on every pass.

1555

self._update_basis_apply_deletes(deletes)

1556

deletes = []

1557

# Split into an add/delete pair recursively.

1558

adds.append((None, new_path_utf8, file_id,

1559

inv_to_entry(inv_entry), False))

1560

# Expunge deletes that we've seen so that deleted/renamed

1561

# children of a rename directory are handled correctly.

1562

new_deletes = reversed(list(self._iter_child_entries(1,

1563

encode(old_path))))

1564

# Remove the current contents of the tree at orig_path, and

1565

# reinsert at the correct new path.

1566

for entry in new_deletes:

1567

if entry[0][0]:

1568

source_path = entry[0][0] + '/' + entry[0][1]

1569

else:

1570

source_path = entry[0][1]

1571

if new_path_utf8:

1572

target_path = new_path_utf8 + source_path[len(old_path):]

1573

else:

1574

if old_path == '':

1575

raise AssertionError("cannot rename directory to"

1576

" itself")

1577

target_path = source_path[len(old_path) + 1:]

1578

adds.append((None, target_path, entry[0][2], entry[1][1], False))

1579

deletes.append(

1580

(source_path, target_path, entry[0][2], None, False))

1581

deletes.append(

1582

(encode(old_path), new_path, file_id, None, False))

1583

else:

1584

# changes to just the root should not require remove/insertion

1585

# of everything.

1586

changes.append((encode(old_path), encode(new_path), file_id,

1587

inv_to_entry(inv_entry)))

1588

self._check_delta_ids_absent(new_ids, delta, 1)

1589

try:

1590

# Finish expunging deletes/first half of renames.

1591

self._update_basis_apply_deletes(deletes)

1592

# Reinstate second half of renames and new paths.

1593

self._update_basis_apply_adds(adds)

1594

# Apply in-situ changes.

1595

self._update_basis_apply_changes(changes)

1596

# Validate parents

1597

self._after_delta_check_parents(parents, 1)

1598

except errors.BzrError, e:

1599

self._changes_aborted = True

1600

if 'integrity error' not in str(e):

1601

raise

1602

# _get_entry raises BzrError when a request is inconsistent; we

1603

# want such errors to be shown as InconsistentDelta - and that

1604

# fits the behaviour we trigger. Partof this is driven by dirstate

1605

# only supporting deltas that turn the basis into a closer fit to

1606

# the active tree.

1607

raise errors.InconsistentDeltaDelta(delta, "error from _get_entry.")

1608

1609

self._mark_modified(header_modified=True)

1610

self._id_index = None

1611

return

1612

1613

def _check_delta_ids_absent(self, new_ids, delta, tree_index):

1614

"""Check that none of the file_ids in new_ids are present in a tree."""

1615

if not new_ids:

1616

return

1617

id_index = self._get_id_index()

1618

for file_id in new_ids:

1619

for key in id_index.get(file_id, ()):

1620

block_i, entry_i, d_present, f_present = \

1621

self._get_block_entry_index(key[0], key[1], tree_index)

1622

if not f_present:

1623

# In a different tree

1624

continue

1625

entry = self._dirblocks[block_i][1][entry_i]

1626

if entry[0][2] != file_id:

1627

# Different file_id, so not what we want.

1628

continue

1629

# NB: No changes made before this helper is called, so no need

1630

# to set the _changes_aborted flag.

1631

raise errors.InconsistentDelta(

1632

("%s/%s" % key[0:2]).decode('utf8'), file_id,

1633

"This file_id is new in the delta but already present in "

1634

"the target")

1635

1636

def _update_basis_apply_adds(self, adds):

1637

"""Apply a sequence of adds to tree 1 during update_basis_by_delta.

1638

1639

They may be adds, or renames that have been split into add/delete

1640

pairs.

1641

1642

:param adds: A sequence of adds. Each add is a tuple:

1643

(None, new_path_utf8, file_id, (entry_details), real_add). real_add

1644

is False when the add is the second half of a remove-and-reinsert

1645

pair created to handle renames and deletes.

1646

"""

1647

# Adds are accumulated partly from renames, so can be in any input

1648

# order - sort it.

1649

adds.sort()

1650

# adds is now in lexographic order, which places all parents before

1651

# their children, so we can process it linearly.

1652

absent = 'ar'

1653

for old_path, new_path, file_id, new_details, real_add in adds:

1654

# the entry for this file_id must be in tree 0.

1655

entry = self._get_entry(0, file_id, new_path)

1656

if entry[0] is None or entry[0][2] != file_id:

1657

self._changes_aborted = True

1658

raise errors.InconsistentDelta(new_path, file_id,

1659

'working tree does not contain new entry')

1660

if real_add and entry[1][1][0] not in absent:

1661

self._changes_aborted = True

1662

raise errors.InconsistentDelta(new_path, file_id,

1663

'The entry was considered to be a genuinely new record,'

1664

' but there was already an old record for it.')

1665

# We don't need to update the target of an 'r' because the handling

1666

# of renames turns all 'r' situations into a delete at the original

1667

# location.

1668

entry[1][1] = new_details

1669

1670

def _update_basis_apply_changes(self, changes):

1671

"""Apply a sequence of changes to tree 1 during update_basis_by_delta.

1672

1673

:param adds: A sequence of changes. Each change is a tuple:

1674

(path_utf8, path_utf8, file_id, (entry_details))

1675

"""

1676

absent = 'ar'

1677

for old_path, new_path, file_id, new_details in changes:

1678

# the entry for this file_id must be in tree 0.

1679

entry = self._get_entry(0, file_id, new_path)

1680

if entry[0] is None or entry[0][2] != file_id:

1681

self._changes_aborted = True

1682

raise errors.InconsistentDelta(new_path, file_id,

1683

'working tree does not contain new entry')

1684

if (entry[1][0][0] in absent or

1685

entry[1][1][0] in absent):

1686

self._changes_aborted = True

1687

raise errors.InconsistentDelta(new_path, file_id,

1688

'changed considered absent')

1689

entry[1][1] = new_details

1690

1691

def _update_basis_apply_deletes(self, deletes):
    """Apply a sequence of deletes to tree 1 during update_basis_by_delta.

    They may be deletes, or renames that have been split into add/delete
    pairs.

    :param deletes: A sequence of deletes. Each delete is a tuple:
        (old_path_utf8, new_path_utf8, file_id, None, real_delete).
        real_delete is True when the desired outcome is an actual deletion
        rather than the rename handling logic temporarily deleting a path
        during the replacement of a parent.
    """
    null_details = DirState.NULL_PARENT_DETAILS
    for old_path, new_path, file_id, _, real_delete in deletes:
        # A real delete has no new path; a rename half always has one.
        if real_delete != (new_path is None):
            self._changes_aborted = True
            raise AssertionError("bad delete delta")
        # the entry for this file_id must be in tree 1.
        dirname, basename = osutils.split(old_path)
        block_index, entry_index, dir_present, file_present = \
            self._get_block_entry_index(dirname, basename, 1)
        if not file_present:
            self._changes_aborted = True
            raise errors.InconsistentDelta(old_path, file_id,
                'basis tree does not contain removed entry')
        block = self._dirblocks[block_index][1]
        entry = block[entry_index]
        if entry[0][2] != file_id:
            self._changes_aborted = True
            raise errors.InconsistentDelta(old_path, file_id,
                'mismatched file_id in tree 1')
        wt_minikind = entry[1][0][0]
        if real_delete:
            if wt_minikind != 'a':
                self._changes_aborted = True
                raise errors.InconsistentDelta(old_path, file_id,
                        'This was marked as a real delete, but the WT state'
                        ' claims that it still exists and is versioned.')
            del block[entry_index]
        elif wt_minikind == 'a':
            self._changes_aborted = True
            raise errors.InconsistentDelta(old_path, file_id,
                'The entry was considered a rename, but the source path'
                ' is marked as absent.')
            # For whatever reason, we were asked to rename an entry
            # that was originally marked as deleted. This could be
            # because we are renaming the parent directory, and the WT
            # current state has the file marked as deleted.
        elif wt_minikind == 'r':
            # implement the rename
            del block[entry_index]
        else:
            # it is being resurrected here, so blank it out temporarily.
            entry[1][1] = null_details

1744

1745

def _after_delta_check_parents(self, parents, index):

1746

"""Check that parents required by the delta are all intact.

1747

1748

:param parents: An iterable of (path_utf8, file_id) tuples which are

1749

required to be present in tree 'index' at path_utf8 with id file_id

1750

and be a directory.

1751

:param index: The column in the dirstate to check for parents in.

1752

"""

1753

for dirname_utf8, file_id in parents:

1754

# Get the entry - the ensures that file_id, dirname_utf8 exists and

1755

# has the right file id.

1756

entry = self._get_entry(index, file_id, dirname_utf8)

1757

if entry[1] is None:

1758

self._changes_aborted = True

1759

raise errors.InconsistentDelta(dirname_utf8.decode('utf8'),

1760

file_id, "This parent is not present.")

1761

# Parents of things must be directories

1762

if entry[1][index][0] != 'd':

1763

self._changes_aborted = True

1764

raise errors.InconsistentDelta(dirname_utf8.decode('utf8'),

1765

file_id, "This parent is not a directory.")

1766

1767

def _observed_sha1(self, entry, sha1, stat_value,

1768

_stat_to_minikind=_stat_to_minikind, _pack_stat=pack_stat):

1769

"""Note the sha1 of a file.

1770

1771

:param entry: The entry the sha1 is for.

1772

:param sha1: The observed sha1.

1773

:param stat_value: The os.lstat for the file.

1774

"""

1775

try:

1776

minikind = _stat_to_minikind[stat_value.st_mode & 0170000]

1777

except KeyError:

1778

# Unhandled kind

1779

return None

1780

packed_stat = _pack_stat(stat_value)

1781

if minikind == 'f':

1782

if self._cutoff_time is None:

1783

self._sha_cutoff_time()

1784

if (stat_value.st_mtime < self._cutoff_time

1785

and stat_value.st_ctime < self._cutoff_time):

1786

entry[1][0] = ('f', sha1, stat_value.st_size, entry[1][0][3],

1787

packed_stat)

1788

self._mark_modified([entry])

1789

1790

def _sha_cutoff_time(self):

1791

"""Return cutoff time.

1792

1793

Files modified more recently than this time are at risk of being

1794

undetectably modified and so can't be cached.

1795

"""

1796

# Cache the cutoff time as long as we hold a lock.

1797

# time.time() isn't super expensive (approx 3.38us), but

1798

# when you call it 50,000 times it adds up.

1799

# For comparison, os.lstat() costs 7.2us if it is hot.

1800

self._cutoff_time = int(time.time()) - 3

1801

return self._cutoff_time

1802

1803

def _lstat(self, abspath, entry):

1804

"""Return the os.lstat value for this path."""

1805

return os.lstat(abspath)

1806

1807

def _sha1_file_and_mutter(self, abspath):
    """Log that abspath is being hashed, then return its sha1.

    The sha1 comes from self._sha1_provider.
    """
    # when -Dhashcache is turned on, this is monkey-patched in to log
    # file reads
    message = "dirstate sha1 " + abspath
    trace.mutter(message)
    return self._sha1_provider.sha1(abspath)

1812

1813

def _is_executable(self, mode, old_executable):

1814

"""Is this file executable?"""

1815

return bool(S_IEXEC & mode)

1816

1817

def _is_executable_win32(self, mode, old_executable):

1818

"""On win32 the executable bit is stored in the dirstate."""

1819

return old_executable

1820

1821

if sys.platform == 'win32':
    # On win32 the executable bit comes from the dirstate record rather
    # than from the stat mode, so the win32 variant replaces the default.
    _is_executable = _is_executable_win32

1823

1824

def _read_link(self, abspath, old_link):
    """Read the target of a symlink

    :param abspath: The path of the link; a unicode path is encoded to the
        filesystem encoding before it is read.
    :param old_link: Not used by this implementation.
    :return: The link target. Unless the filesystem encoding is UTF-8 or
        an ASCII variant, the target is re-encoded to UTF-8.
    """
    # TODO: jam 200700301 On Win32, this could just return the value
    #       already in memory. However, this really needs to be done at a
    #       higher level, because there either won't be anything on disk,
    #       or the thing on disk will be a file.
    fs_encoding = osutils._fs_enc
    if isinstance(abspath, unicode):
        # abspath is defined as the path to pass to lstat. readlink is
        # buggy in python < 2.6 (it doesn't encode unicode path into FS
        # encoding), so we need to encode ourselves knowing that unicode
        # paths are produced by UnicodeDirReader on purpose.
        abspath = abspath.encode(fs_encoding)
    target = os.readlink(abspath)
    if fs_encoding in ('UTF-8', 'US-ASCII', 'ANSI_X3.4-1968'):
        return target
    # Change encoding if needed
    return target.decode(fs_encoding).encode('UTF-8')

1842

1843

def get_ghosts(self):
    """Return a list of the parent tree revision ids that are ghosts.

    The header is read first if needed. The list returned is the
    dirstate's own self._ghosts object, not a copy.
    """
    self._read_header_if_needed()
    ghosts = self._ghosts
    return ghosts

1847

1848

def get_lines(self):
    """Serialise the entire dirstate to a sequence of lines.

    When neither the header nor the dirblocks have been modified in
    memory, the lines are read straight back from the state file.
    """
    unmodified = DirState.IN_MEMORY_UNMODIFIED
    if (self._header_state == unmodified and
        self._dirblock_state == unmodified):
        # read what's on disk.
        self._state_file.seek(0)
        return self._state_file.readlines()
    lines = [
        self._get_parents_line(self.get_parent_ids()),
        self._get_ghosts_line(self._ghosts),
    ]
    lines.extend(self._get_entry_lines())
    return self._get_output_lines(lines)

1860

1861

def _get_ghosts_line(self, ghost_ids):

1862

"""Create a line for the state file for ghost information."""

1863

return '\0'.join([str(len(ghost_ids))] + ghost_ids)

1864

1865

def _get_parents_line(self, parent_ids):

1866

"""Create a line for the state file for parents information."""

1867

return '\0'.join([str(len(parent_ids))] + parent_ids)

1868

1869

def _get_entry_lines(self):

1870

"""Create lines for entries."""

1871

return map(self._entry_to_line, self._iter_entries())

1872

1873

def _get_fields_to_entry(self):

1874

"""Get a function which converts entry fields into a entry record.

1875

1876

This handles size and executable, as well as parent records.

1877

1878

:return: A function which takes a list of fields, and returns an

1879

appropriate record for storing in memory.

1880

"""

1881

# This is intentionally unrolled for performance

1882

num_present_parents = self._num_present_parents()

1883

if num_present_parents == 0:

1884

def fields_to_entry_0_parents(fields, _int=int):

1885

path_name_file_id_key = (fields[0], fields[1], fields[2])

1886

return (path_name_file_id_key, [

1887

( # Current tree

1888

fields[3], # minikind

1889

fields[4], # fingerprint

1890

_int(fields[5]), # size

1891

fields[6] == 'y', # executable

1892

fields[7], # packed_stat or revision_id

1893

)])

1894

return fields_to_entry_0_parents

1895

elif num_present_parents == 1:

1896

def fields_to_entry_1_parent(fields, _int=int):

1897

path_name_file_id_key = (fields[0], fields[1], fields[2])

1898

return (path_name_file_id_key, [

1899

( # Current tree

1900

fields[3], # minikind

1901

fields[4], # fingerprint

1902

_int(fields[5]), # size

1903

fields[6] == 'y', # executable

1904

fields[7], # packed_stat or revision_id

1905

1906

( # Parent 1

1907

fields[8], # minikind

1908

fields[9], # fingerprint

1909

_int(fields[10]), # size

1910

fields[11] == 'y', # executable

1911

fields[12], # packed_stat or revision_id

1912

1913

])

1914

return fields_to_entry_1_parent

1915

elif num_present_parents == 2:

1916

def fields_to_entry_2_parents(fields, _int=int):

1917

path_name_file_id_key = (fields[0], fields[1], fields[2])

1918

return (path_name_file_id_key, [

1919

( # Current tree

1920

fields[3], # minikind

1921

fields[4], # fingerprint

1922

_int(fields[5]), # size

1923

fields[6] == 'y', # executable

1924

fields[7], # packed_stat or revision_id

1925

1926

( # Parent 1

1927

fields[8], # minikind

1928

fields[9], # fingerprint

1929

_int(fields[10]), # size

1930

fields[11] == 'y', # executable

1931

fields[12], # packed_stat or revision_id

1932

1933

( # Parent 2

1934

fields[13], # minikind

1935

fields[14], # fingerprint

1936

_int(fields[15]), # size

1937

fields[16] == 'y', # executable

1938

fields[17], # packed_stat or revision_id

1939

1940

])

1941

return fields_to_entry_2_parents

1942

else:

1943

def fields_to_entry_n_parents(fields, _int=int):

1944

path_name_file_id_key = (fields[0], fields[1], fields[2])

1945

trees = [(fields[cur], # minikind

1946

fields[cur+1], # fingerprint

1947

_int(fields[cur+2]), # size

1948

fields[cur+3] == 'y', # executable

1949

fields[cur+4], # stat or revision_id

1950

) for cur in xrange(3, len(fields)-1, 5)]

1951

return path_name_file_id_key, trees

1952

return fields_to_entry_n_parents

1953

1954

def get_parent_ids(self):
    """Return the parent tree ids recorded in this directory state.

    :return: A new list, so callers may modify it without touching the
        list held by the dirstate.
    """
    self._read_header_if_needed()
    parents_copy = list(self._parents)
    return parents_copy

1958

1959

def _get_block_entry_index(self, dirname, basename, tree_index):

1960

"""Get the coordinates for a path in the state structure.

1961

1962

:param dirname: The utf8 dirname to lookup.

1963

:param basename: The utf8 basename to lookup.

1964

:param tree_index: The index of the tree for which this lookup should

1965

be attempted.

1966

:return: A tuple describing where the path is located, or should be

1967

inserted. The tuple contains four fields: the block index, the row

1968

index, the directory is present (boolean), the entire path is

1969

present (boolean). There is no guarantee that either

1970

coordinate is currently reachable unless the found field for it is

1971

True. For instance, a directory not present in the searched tree

1972

may be returned with a value one greater than the current highest

1973

block offset. The directory present field will always be True when

1974

the path present field is True. The directory present field does

1975

NOT indicate that the directory is present in the searched tree,

1976

rather it indicates that there are at least some files in some

1977

tree present there.

1978

"""

1979

self._read_dirblocks_if_needed()

1980

key = dirname, basename, ''

1981

block_index, present = self._find_block_index_from_key(key)

1982

if not present:

1983

# no such directory - return the dir index and 0 for the row.

1984

return block_index, 0, False, False

1985

block = self._dirblocks[block_index][1] # access the entries only

1986

entry_index, present = self._find_entry_index(key, block)

1987

# linear search through entries at this path to find the one

1988

# requested.

1989

while entry_index < len(block) and block[entry_index][0][1] == basename:

1990

if block[entry_index][1][tree_index][0] not in 'ar':

1991

# neither absent or relocated

1992

return block_index, entry_index, True, True

1993

entry_index += 1

1994

return block_index, entry_index, True, False

1995

1996

def _get_entry(self, tree_index, fileid_utf8=None, path_utf8=None, include_deleted=False):

1997

"""Get the dirstate entry for path in tree tree_index.

1998

1999

If either file_id or path is supplied, it is used as the key to lookup.

2000

If both are supplied, the fastest lookup is used, and an error is

2001

raised if they do not both point at the same row.

2002

2003

:param tree_index: The index of the tree we wish to locate this path

2004

in. If the path is present in that tree, the entry containing its

2005

details is returned, otherwise (None, None) is returned

2006

0 is the working tree, higher indexes are successive parent

2007

trees.

2008

:param fileid_utf8: A utf8 file_id to look up.

2009

:param path_utf8: An utf8 path to be looked up.

2010

:param include_deleted: If True, and performing a lookup via

2011

fileid_utf8 rather than path_utf8, return an entry for deleted

2012

(absent) paths.

2013

:return: The dirstate entry tuple for path, or (None, None)

2014

"""

2015

self._read_dirblocks_if_needed()

2016

if path_utf8 is not None:

2017

if type(path_utf8) is not str:

2018

raise errors.BzrError('path_utf8 is not a str: %s %r'

2019

% (type(path_utf8), path_utf8))

2020

# path lookups are faster

2021

dirname, basename = osutils.split(path_utf8)

2022

block_index, entry_index, dir_present, file_present = \

2023

self._get_block_entry_index(dirname, basename, tree_index)

2024

if not file_present:

2025

return None, None

2026

entry = self._dirblocks[block_index][1][entry_index]

2027

if not (entry[0][2] and entry[1][tree_index][0] not in ('a', 'r')):

2028

raise AssertionError('unversioned entry?')

2029

if fileid_utf8:

2030

if entry[0][2] != fileid_utf8:

2031

self._changes_aborted = True

2032

raise errors.BzrError('integrity error ? : mismatching'

2033

' tree_index, file_id and path')

2034

return entry

2035

else:

2036

possible_keys = self._get_id_index().get(fileid_utf8, ())

2037

if not possible_keys:

2038

return None, None

2039

for key in possible_keys:

2040

block_index, present = \

2041

self._find_block_index_from_key(key)

2042

# strange, probably indicates an out of date

2043

# id index - for now, allow this.

2044

if not present:

2045

continue

2046

# WARNING: DO not change this code to use _get_block_entry_index

2047

# as that function is not suitable: it does not use the key

2048

# to lookup, and thus the wrong coordinates are returned.

2049

block = self._dirblocks[block_index][1]

2050

entry_index, present = self._find_entry_index(key, block)

2051

if present:

2052

entry = self._dirblocks[block_index][1][entry_index]

2053

# TODO: We might want to assert that entry[0][2] ==

2054

# fileid_utf8.

2055

if entry[1][tree_index][0] in 'fdlt':

2056

# this is the result we are looking for: the

2057

# real home of this file_id in this tree.

2058

return entry

2059

if entry[1][tree_index][0] == 'a':

2060

# there is no home for this entry in this tree

2061

if include_deleted:

2062

return entry

2063

return None, None

2064

if entry[1][tree_index][0] != 'r':

2065

raise AssertionError(

2066

"entry %r has invalid minikind %r for tree %r" \

2067

% (entry,

2068

entry[1][tree_index][0],

2069

tree_index))

2070

real_path = entry[1][tree_index][1]

2071

return self._get_entry(tree_index, fileid_utf8=fileid_utf8,

2072

path_utf8=real_path)

2073

return None, None

2074

2075

@classmethod
def initialize(cls, path, sha1_provider=None):
    """Create a new, empty dirstate stored at path.

    The new dirstate describes an empty tree: no parents, and a single
    root node whose id is ROOT_ID.

    :param path: The name of the file for the dirstate.
    :param sha1_provider: an object meeting the SHA1Provider interface.
        If None, a DefaultSHA1Provider is used.
    :return: A write-locked DirState object.
    """
    # Build the object, hand it the stock "empty tree" data through
    # _set_data(), then save() so that the data persists.
    if sha1_provider is None:
        sha1_provider = DefaultSHA1Provider()
    result = cls(path, sha1_provider)
    # a new root directory, with a NULLSTAT.
    root_entry = (('', '', inventory.ROOT_ID), [
        ('d', '', 0, False, DirState.NULLSTAT),
        ])
    # Two blocks: the root dir itself, then the (empty) root contents.
    empty_tree_dirblocks = [('', [root_entry]), ('', [])]
    result.lock_write()
    try:
        result._set_data([], empty_tree_dirblocks)
        result.save()
    except:
        # Deliberately bare: whatever went wrong, release the lock before
        # letting the error propagate.
        result.unlock()
        raise
    return result

2110

2111

@staticmethod
def _inv_entry_to_details(inv_entry):
    """Build the per-tree details tuple for an inventory entry.

    :param inv_entry: An inventory entry (from a revision tree) whose sha1
        and link targets can be relied upon, and which has a revision set.
    :return: A details tuple ``(minikind, fingerprint, size, executable,
        revision)`` - the details for a single tree at a path + id.
    :raises Exception: if the entry kind is not one handled here.
    """
    kind = inv_entry.kind
    minikind = DirState._kind_to_minikind[kind]
    tree_data = inv_entry.revision
    # Only files override these two; every other kind stores 0 / False.
    size = 0
    executable = False
    if kind == 'directory':
        fingerprint = ''
    elif kind == 'symlink':
        target = inv_entry.symlink_target
        if target is None:
            fingerprint = ''
        else:
            fingerprint = target.encode('utf8')
    elif kind == 'file':
        fingerprint = inv_entry.text_sha1 or ''
        size = inv_entry.text_size or 0
        executable = inv_entry.executable
    elif kind == 'tree-reference':
        fingerprint = inv_entry.reference_revision or ''
    else:
        raise Exception("can't pack %s" % inv_entry)
    return (minikind, fingerprint, size, executable, tree_data)

2145

2146

def _iter_child_entries(self, tree_index, path_utf8):

2147

"""Iterate over all the entries that are children of path_utf.

2148

2149

This only returns entries that are present (not in 'a', 'r') in

2150

tree_index. tree_index data is not refreshed, so if tree 0 is used,

2151

results may differ from that obtained if paths were statted to

2152

determine what ones were directories.

2153

2154

Asking for the children of a non-directory will return an empty

2155

iterator.

2156

"""

2157

pending_dirs = []

2158

next_pending_dirs = [path_utf8]

2159

absent = 'ar'

2160

while next_pending_dirs:

2161

pending_dirs = next_pending_dirs

2162

next_pending_dirs = []

2163

for path in pending_dirs:

2164

block_index, present = self._find_block_index_from_key(

2165

(path, '', ''))

2166

if block_index == 0:

2167

block_index = 1

2168

if len(self._dirblocks) == 1:

2169

# asked for the children of the root with no other

2170

# contents.

2171

return

2172

if not present:

2173

# children of a non-directory asked for.

2174

continue

2175

block = self._dirblocks[block_index]

2176

for entry in block[1]:

2177

kind = entry[1][tree_index][0]

2178

if kind not in absent:

2179

yield entry

2180

if kind == 'd':

2181

if entry[0][0]:

2182

path = entry[0][0] + '/' + entry[0][1]

2183

else:

2184

path = entry[0][1]

2185

next_pending_dirs.append(path)

2186

2187

def _iter_entries(self):

2188

"""Iterate over all the entries in the dirstate.

2189

2190

Each yelt item is an entry in the standard format described in the

2191

docstring of bzrlib.dirstate.

2192

"""

2193

self._read_dirblocks_if_needed()

2194

for directory in self._dirblocks:

2195

for entry in directory[1]:

2196

yield entry

2197

2198

def _get_id_index(self):

2199

"""Get an id index of self._dirblocks.

2200

2201

This maps from file_id => [(directory, name, file_id)] entries where

2202

that file_id appears in one of the trees.

2203

"""

2204

if self._id_index is None:

2205

id_index = {}

2206

for key, tree_details in self._iter_entries():

2207

self._add_to_id_index(id_index, key)

2208

self._id_index = id_index

2209

return self._id_index

2210

2211

def _add_to_id_index(self, id_index, entry_key):
    """Record entry_key under its file id in the id_index mapping.

    :param id_index: The file_id => keys mapping to update in place.
    :param entry_key: A (dirname, basename, file_id) key.
    """
    # Each file id maps to a plain tuple of keys rather than a set: more
    # than one key per id is *rare*, and the count can never exceed the
    # number of trees (rarely >2). With N that small the O(N) 'in' check
    # below cannot turn quadratic, and a set per id would be overkill.
    file_id = entry_key[2]
    new_key = static_tuple.StaticTuple.from_sequence(entry_key)
    try:
        known_keys = id_index[file_id]
    except KeyError:
        # First key seen for this file id.
        id_index[file_id] = static_tuple.StaticTuple(new_key,)
        return
    if new_key not in known_keys:
        id_index[file_id] = known_keys + (new_key,)

2229

2230

def _remove_from_id_index(self, id_index, entry_key):
    """Drop entry_key from the keys recorded for its file id.

    It is a programming error to call this when the entry_key is not
    already present.

    :param id_index: The file_id => keys mapping to update in place.
    :param entry_key: A (dirname, basename, file_id) key.
    """
    file_id = entry_key[2]
    remaining_keys = list(id_index[file_id])
    remaining_keys.remove(entry_key)
    id_index[file_id] = static_tuple.StaticTuple.from_sequence(
        remaining_keys)

2240

2241

def _get_output_lines(self, lines):
    """Format lines for final output.

    The caller's sequence is left untouched: the trailing empty field that
    terminates the last record is added to a private copy.

    :param lines: A sequence of lines containing the parents list and the
        path lines (the parents line first, then the ghosts line, then one
        line per entry).
    :return: A list of strings: the format header, the crc32 line, the
        num_entries line and finally the joined inventory text.
    """
    output_lines = [DirState.HEADER_FORMAT_3]
    # The extra '' makes the joined text end with the record separator
    # (a final newline).
    inventory_text = '\0\n\0'.join(list(lines) + [''])
    output_lines.append('crc32: %s\n' % (zlib.crc32(inventory_text),))
    # -2: 1 for the num parents line, 1 for the ghosts line
    num_entries = len(lines) - 2
    output_lines.append('num_entries: %s\n' % (num_entries,))
    output_lines.append(inventory_text)
    return output_lines

2256

2257

def _make_deleted_row(self, fileid_utf8, parents):
    """Build a placeholder row marking fileid_utf8 as deleted.

    :param fileid_utf8: The file id to place in the row.
    :param parents: Returned unchanged as the second element.
    :return: A ``(row, parents)`` pair.
    """
    deleted_row = ('/', 'RECYCLED.BIN', 'file', fileid_utf8, 0,
                   DirState.NULLSTAT, '')
    return deleted_row, parents

2261

2262

def _num_present_parents(self):

2263

"""The number of parent entries in each record row."""

2264

return len(self._parents) - len(self._ghosts)

2265

2266

@classmethod
def on_file(cls, path, sha1_provider=None, worth_saving_limit=0):
    """Construct a DirState for the dirstate file at "path".

    :param path: The path at which the dirstate file on disk should live.
    :param sha1_provider: an object meeting the SHA1Provider interface.
        If None, a DefaultSHA1Provider is used.
    :param worth_saving_limit: when the exact number of hash changed
        entries is known, only bother saving the dirstate if more than
        this count of entries have changed. -1 means never save.
    :return: An unlocked DirState object, associated with the given path.
    """
    provider = sha1_provider
    if provider is None:
        provider = DefaultSHA1Provider()
    return cls(path, provider, worth_saving_limit=worth_saving_limit)

2283

2284

def _read_dirblocks_if_needed(self):
    """Load all the dirblocks from the file unless already in memory.

    The header is read first if needed. When the dirblocks are not in
    memory they are all loaded through _read_dirblocks(), which is
    expected to populate self._dirblocks and move self._dirblock_state
    to IN_MEMORY_UNMODIFIED. Loading is all-or-nothing: incremental
    block loading is not currently supported.
    """
    self._read_header_if_needed()
    if self._dirblock_state != DirState.NOT_IN_MEMORY:
        return
    _read_dirblocks(self)

2294

2295

def _read_header(self):
    """Read the metadata header, the parent ids and the ghost ids.

    The results are stored on the object (self._parents, self._ghosts,
    self._header_state and self._end_of_header, plus whatever
    _read_prelude() records); nothing is returned.

    After reading in, the file should be positioned at the null
    just before the start of the first record in the file.

    :raises ValueError: if a count field in the header is not an integer.
    """
    self._read_prelude()
    parent_fields = self._state_file.readline().split('\0')
    # The count is parsed only as a sanity check on the line; the ids
    # themselves are taken from the remaining fields.
    int(parent_fields[0])
    self._parents = parent_fields[1:-1]
    # The ghosts line carries one extra leading field compared with the
    # parents line, hence the different offsets.
    ghost_fields = self._state_file.readline().split('\0')
    int(ghost_fields[1])
    self._ghosts = ghost_fields[2:-1]
    self._header_state = DirState.IN_MEMORY_UNMODIFIED
    # Remember where the records start.
    self._end_of_header = self._state_file.tell()

2314

2315

def _read_header_if_needed(self):
    """Read the dirstate file header unless it is already in memory.

    :raises errors.ObjectNotLocked: if the dirstate holds no lock.
    """
    # Kept tiny and inline as it will be called a lot.
    if not self._lock_token:
        raise errors.ObjectNotLocked(self)
    if self._header_state != DirState.NOT_IN_MEMORY:
        return
    self._read_header()

2322

2323

def _read_prelude(self):
    """Read the first three lines (the prelude) of the dirstate file.

    This only reads in the stuff that is not connected to the crc
    checksum: the format line, the crc32 line and the num_entries line.
    The values are stored on self.crc_expected and self._num_entries.
    Afterwards the file is positioned so that the rest of it can be read
    and checked against the checksum; the next thing in the file should
    be the number of parents and their ids, followed by a newline.

    :raises errors.BzrError: if any of the three lines is malformed.
    """
    readline = self._state_file.readline
    crc_prefix = 'crc32: '
    entries_prefix = 'num_entries: '

    header = readline()
    if header != DirState.HEADER_FORMAT_3:
        raise errors.BzrError(
            'invalid header line: %r' % (header,))

    crc_line = readline()
    if not crc_line.startswith(crc_prefix):
        raise errors.BzrError('missing crc32 checksum: %r' % crc_line)
    # [:-1] drops the last character of the line (the newline).
    self.crc_expected = int(crc_line[len(crc_prefix):-1])

    num_entries_line = readline()
    if not num_entries_line.startswith(entries_prefix):
        raise errors.BzrError('missing num_entries line')
    self._num_entries = int(num_entries_line[len(entries_prefix):-1])

2344

2345

def sha1_from_stat(self, path, stat_result, _pack_stat=pack_stat):
    """Look up a cached sha1 by the packed form of a stat result.

    :param path: Not used by the lookup.
    :param stat_result: The stat value to pack and look up.
    :return: The sha1 recorded for that packed stat, or None if the
        packed stat index has no such key.
    """
    stat_index = self._get_packed_stat_index()
    packed = _pack_stat(stat_result)
    return stat_index.get(packed, None)

2348

2349

def _get_packed_stat_index(self):

2350

"""Get a packed_stat index of self._dirblocks."""

2351

if self._packed_stat_index is None:

2352

index = {}

2353

for key, tree_details in self._iter_entries():

2354

if tree_details[0][0] == 'f':

2355

index[tree_details[0][4]] = tree_details[0][1]

2356

self._packed_stat_index = index

2357

return self._packed_stat_index

2358

2359

def save(self):
    """Write any pending changes made during this session to disk.

    The existing file is rewritten in place rather than replaced: that
    avoids races with file creation, and replacing a file in use by
    another process is impossible on Windows. OS locks on the file guard
    against concurrent modification and reads, because dirstate's
    incremental data aggregation is not compatible with reading a
    modified file.

    A dirstate in read only mode should be smart enough though to validate
    that the file has not changed, and otherwise discard its cache and
    start over, to allow for fine grained read lock duration, so 'status'
    wont block 'commit' - for example.

    Nothing is written when changes were aborted, when _worth_saving()
    says no, or when a write lock is needed but cannot be obtained.
    """
    if self._changes_aborted:
        # Should this be a warning? For now, I'm expecting that places that
        # mark it inconsistent will warn, making a warning here redundant.
        trace.mutter('Not saving DirState because '
                '_changes_aborted is set.')
        return
    # TODO: Since we now distinguish IN_MEMORY_MODIFIED from
    #       IN_MEMORY_HASH_MODIFIED, we should only fail quietly if we fail
    #       to save an IN_MEMORY_HASH_MODIFIED, and fail *noisily* if we
    #       fail to save IN_MEMORY_MODIFIED
    if not self._worth_saving():
        return

    grabbed_write_lock = False
    if self._lock_state != 'w':
        # Only a read lock is held: try to upgrade it for the write.
        grabbed_write_lock, new_lock = self._lock_token.temporary_write_lock()
        # Switch over to the new lock, as the old one may be closed.
        # TODO: jam 20070315 We should validate the disk file has
        #       not changed contents. Since temporary_write_lock may
        #       not be an atomic operation.
        self._lock_token = new_lock
        self._state_file = new_lock.f
        if not grabbed_write_lock:
            # We couldn't grab a write lock, so we switch back to a read one
            return
    try:
        lines = self.get_lines()
        state_file = self._state_file
        state_file.seek(0)
        state_file.writelines(lines)
        # Cut off whatever is left of a longer, older version.
        state_file.truncate()
        state_file.flush()
        self._mark_unmodified()
    finally:
        if grabbed_write_lock:
            # Downgrade again, even if the write failed.
            self._lock_token = self._lock_token.restore_read_lock()
            self._state_file = self._lock_token.f
            # TODO: jam 20070315 We should validate the disk file has
            #       not changed contents. Since restore_read_lock may
            #       not be an atomic operation.

2410

2411

def _worth_saving(self):
    """Decide whether the in-memory state deserves to be written out.

    :return: True when the header or the dirblocks are fully modified, or
        when only hashes changed and the number of known hash changes has
        reached self._worth_saving_limit. False otherwise, and always
        False for hash-only changes when the limit is -1.
    """
    modified = DirState.IN_MEMORY_MODIFIED
    if self._header_state == modified or self._dirblock_state == modified:
        return True
    if self._dirblock_state != DirState.IN_MEMORY_HASH_MODIFIED:
        return False
    if self._worth_saving_limit == -1:
        # We never save hash changes when the limit is -1
        return False
    # If we're using smart saving and only a small number of
    # entries have changed their hash, don't bother saving. John has
    # suggested using a heuristic here based on the size of the
    # changed files and/or tree. For now, we go with a configurable
    # number of changes, keeping the calculation time
    # as low overhead as possible. (This also keeps all existing
    # tests passing as the default is 0, i.e. always save.)
    return len(self._known_hash_changes) >= self._worth_saving_limit

2430

2431

def _set_data(self, parent_ids, dirblocks):

2432

"""Set the full dirstate data in memory.

2433

2434

This is an internal function used to completely replace the objects

2435

in memory state. It puts the dirstate into state 'full-dirty'.

2436

2437

:param parent_ids: A list of parent tree revision ids.

2438

:param dirblocks: A list containing one tuple for each directory in the

2439

tree. Each tuple contains the directory path and a list of entries

2440

found in that directory.

2441

"""

2442

# our memory copy is now authoritative.

2443

self._dirblocks = dirblocks

2444

self._mark_modified(header_modified=True)

2445

self._parents = list(parent_ids)

2446

self._id_index = None

2447

self._packed_stat_index = None

2448

2449

def set_path_id(self, path, new_id):

2450

"""Change the id of path to new_id in the current working tree.

2451

2452

:param path: The path inside the tree to set - '' is the root, 'foo'

2453

is the path foo in the root.

2454

:param new_id: The new id to assign to the path. This must be a utf8

2455

file id (not unicode, and not None).

2456

"""

2457

self._read_dirblocks_if_needed()

2458

if len(path):

2459

# TODO: logic not written

2460

raise NotImplementedError(self.set_path_id)

2461

# TODO: check new id is unique

2462

entry = self._get_entry(0, path_utf8=path)

2463

if entry[0][2] == new_id:

2464

# Nothing to change.

2465

return

2466

# mark the old path absent, and insert a new root path

2467

self._make_absent(entry)

2468

self.update_minimal(('', '', new_id), 'd',

2469

path_utf8='', packed_stat=entry[1][0][4])

2470

self._mark_modified()

2471

# XXX: This was added by Ian, we need to make sure there

2472

# are tests for it, because it isn't in bzr.dev TRUNK

2473

# It looks like the only place it is called is in setting the root

2474

# id of the tree. So probably we never had an _id_index when we

2475

# don't even have a root yet.

2476

if self._id_index is not None:

2477

self._add_to_id_index(self._id_index, entry[0])

2478

2479

def set_parent_trees(self, trees, ghosts):
    """Replace the parent trees recorded in the dirstate.

    Every row is rebuilt from scratch: the current tree's details are kept
    and the details of each non-ghost parent tree are stitched in next to
    them, with relocation pointers wherever a file id lives at different
    paths in different trees.

    :param trees: A list of revision_id, tree tuples. tree must be provided
        even if the revision_id refers to a ghost: supply an empty tree in
        this case.
    :param ghosts: A list of the revision_ids that are ghosts at the time
        of setting.
    """
    # TODO: generate a list of parent indexes to preserve to save
    # processing specific parent trees. In the common case one tree will
    # be preserved - the left most parent.
    # TODO: if the parent tree is a dirstate, we might want to walk them
    # all by path in parallel for 'optimal' common-case performance.
    self._read_dirblocks_if_needed()
    # TODO future sketch: Examine the existing parents to generate a change
    # map and then walk the new parent trees only, mapping them into the
    # dirstate. Walk the dirstate at the same time to remove unreferenced
    # entries.
    #
    # Current approach: collect every row in two dictionaries. While
    # updating we must be able to find
    #  - the other keys holding a given file id, so that cross-path links
    #    can be created. The inventories of the other trees are not used
    #    for this because that leads to either double touching, or to
    #    accessing missing keys,
    #  - the row stored for a given key.
    # Parallel iterators would not help: file id data may be scattered
    # throughout, so everything has to be looked at anyway. Incremental
    # updates when adding a parent (merge) could save cycles, but
    # replacing the parents completely (commit) is the more common case,
    # so merge is left to be optimised later.
    rows_by_key = {}    # entry key -> list of per-tree details
    id_index = {}       # file id -> keys holding it

    # ---- start generation of full tree mapping data
    # Ghost trees contribute no details.
    parent_trees = [tree for rev_id, tree in trees if rev_id not in ghosts]
    parent_count = len(parent_trees)
    null_details = DirState.NULL_PARENT_DETAILS

    # one: the current tree
    for current in self._iter_entries():
        current_key = current[0]
        working_details = current[1][0]
        # skip entries not in the current tree
        if working_details[0] in 'ar': # absent, relocated
            continue
        rows_by_key[current_key] = [working_details] + \
            [null_details] * parent_count
        # TODO: Possibly inline this, since we know it isn't present yet
        #       id_index[entry[0][2]] = (entry[0],)
        self._add_to_id_index(id_index, current_key)

    # now the parent trees:
    for position, tree in enumerate(parent_trees):
        # Column 0 is the working tree, so parents start at column 1.
        tree_index = position + 1
        # A row created for this tree is laid out as
        #   already processed details + this tree's details + suffix
        # where the suffix pads the columns of the trees still to come.
        new_location_suffix = [null_details] * (parent_count - tree_index)
        # now stitch in all the entries from this tree
        for path, inv_entry in tree.inventory.iter_entries_by_dir():
            # For each item: first repoint the rows this id has at other
            # paths, then create or update the row at the right path, and
            # only then add (if needed) the id -> key mapping. Adding the
            # mapping last means that every mapping consulted while
            # building a new row is valid and already has the correct
            # relocation records.
            file_id = inv_entry.file_id
            path_utf8 = path.encode('utf8')
            dirname, basename = osutils.split(path_utf8)
            new_entry_key = (dirname, basename, file_id)
            known_keys = id_index.get(file_id, ())
            # tree index consistency: All other paths for this id in this
            # tree index must point to the correct path.
            for other_key in known_keys:
                # TODO:PROFILING: It might be faster to just update
                # rather than checking if we need to, and then overwrite
                # the one we are located at.
                if other_key != new_entry_key:
                    # this file id is at a different path in one of the
                    # other trees, so put absent pointers there
                    # This is the vertical axis in the matrix, all pointing
                    # to the real path.
                    rows_by_key[other_key][tree_index] = (
                        'r', path_utf8, 0, False, '')
            # by path consistency: Insert into an existing path record
            # (trivial), or add a new one with relocation pointers for the
            # other tree indexes.
            if new_entry_key in known_keys:
                # there is already an entry where this data belongs, just
                # insert it.
                rows_by_key[new_entry_key][tree_index] = \
                    self._inv_entry_to_details(inv_entry)
                continue
            # add relocated entries to the horizontal axis - this row
            # mapping from path,id. We need to look up the correct path
            # for the indexes from 0 to tree_index -1
            if not len(known_keys):
                # boundary case: this is the first occurence of file_id,
                # so there is nothing to point at in the earlier trees.
                new_details = [null_details] * tree_index
            else:
                new_details = []
                # grab any one entry, use it to find the right path.
                # TODO: optimise this to reduce memory use in highly
                # fragmented situations by reusing the relocation
                # records.
                a_key = iter(known_keys).next()
                a_row = rows_by_key[a_key]
                for lookup_index in xrange(tree_index):
                    seen = a_row[lookup_index]
                    if seen[0] in ('r', 'a'):
                        # its a pointer or missing statement, use it as is.
                        new_details.append(seen)
                    else:
                        # we have the right key, make a pointer to it.
                        real_path = ('/'.join(a_key[0:2])).strip('/')
                        new_details.append(('r', real_path, 0, False, ''))
            new_details.append(self._inv_entry_to_details(inv_entry))
            new_details.extend(new_location_suffix)
            rows_by_key[new_entry_key] = new_details
            self._add_to_id_index(id_index, new_entry_key)
    # --- end generation of full tree mappings

    # sort and output all the entries
    new_entries = self._sort_entries(rows_by_key.items())
    self._entries_to_current_state(new_entries)
    self._parents = [rev_id for rev_id, tree in trees]
    self._ghosts = list(ghosts)
    self._mark_modified(header_modified=True)
    self._id_index = id_index

2620

2621

def _sort_entries(self, entry_list):

2622

"""Given a list of entries, sort them into the right order.

2623

2624

This is done when constructing a new dirstate from trees - normally we

2625

try to keep everything in sorted blocks all the time, but sometimes

2626

it's easier to sort after the fact.

2627

"""

2628

def _key(entry):

2629

# sort by: directory parts, file name, file id

2630

return entry[0][0].split('/'), entry[0][1], entry[0][2]

2631

return sorted(entry_list, key=_key)

2632

2633

def set_state_from_inventory(self, new_inv):
    """Set new_inv as the current state.

    This API is called by tree transform, and will usually occur with
    existing parent trees.

    The existing tree 0 entries and the inventory entries are walked in
    parallel, in dirblock order.  Entries only in the inventory are added
    via update_minimal, entries only in the dirstate are removed via
    _make_absent, and entries present in both are updated only when the
    executable bit or the minikind differs.

    :param new_inv: The inventory object to set current state from.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(1,
            "set_state_from_inventory called; please mutate the tree instead")
    tracing = 'dirstate' in debug.debug_flags
    if tracing:
        trace.mutter("set_state_from_inventory trace:")
    self._read_dirblocks_if_needed()
    # sketch:
    # Two iterators: current data and new data, both in dirblock order.
    # We zip them together, which tells about entries that are new in the
    # inventory, or removed in the inventory, or present in both and
    # possibly changed.

    # You might think we could just synthesize a new dirstate directly
    # since we're processing it in the right order.  However, we need to
    # also consider there may be any number of parent trees and relocation
    # pointers, and we don't want to duplicate that here.
    new_iterator = new_inv.iter_entries_by_dir()
    # we will be modifying the dirstate, so we need a stable iterator. In
    # future we might write one, for now we just clone the state into a
    # list using a copy so that we see every original item and don't have
    # to adjust the position when items are inserted or deleted in the
    # underlying dirstate.
    old_iterator = iter(list(self._iter_entries()))
    # both must have roots so this is safe:
    current_new = new_iterator.next()
    current_old = old_iterator.next()
    def advance(iterator):
        # Return the iterator's next item, or None once it is exhausted,
        # so that the loop below can test "finished" by truthiness.
        try:
            return iterator.next()
        except StopIteration:
            return None
    while current_new or current_old:
        # skip entries in old that are not really there
        if current_old and current_old[1][0][0] in 'ar':
            # relocated or absent
            current_old = advance(old_iterator)
            continue
        if current_new:
            # convert new into dirblock style
            new_path_utf8 = current_new[0].encode('utf8')
            new_dirname, new_basename = osutils.split(new_path_utf8)
            new_id = current_new[1].file_id
            new_entry_key = (new_dirname, new_basename, new_id)
            current_new_minikind = \
                DirState._kind_to_minikind[current_new[1].kind]
            if current_new_minikind == 't':
                fingerprint = current_new[1].reference_revision or ''
            else:
                # We normally only insert or remove records, or update
                # them when it has significantly changed.  Then we want to
                # erase its fingerprint.  Unaffected records should
                # normally not be updated at all.
                fingerprint = ''
        else:
            # for safety disable variables
            new_path_utf8 = new_dirname = new_basename = new_id = \
                new_entry_key = None
        # 5 cases, we don't have a value that is strictly greater than
        # everything, so we make both end conditions explicit
        if not current_old:
            # old is finished: insert current_new into the state.
            if tracing:
                trace.mutter("Appending from new '%s'.",
                    new_path_utf8.decode('utf8'))
            self.update_minimal(new_entry_key, current_new_minikind,
                executable=current_new[1].executable,
                path_utf8=new_path_utf8, fingerprint=fingerprint,
                fullscan=True)
            current_new = advance(new_iterator)
        elif not current_new:
            # new is finished
            if tracing:
                trace.mutter("Truncating from old '%s/%s'.",
                    current_old[0][0].decode('utf8'),
                    current_old[0][1].decode('utf8'))
            self._make_absent(current_old)
            current_old = advance(old_iterator)
        elif new_entry_key == current_old[0]:
            # same - common case
            # We're looking at the same path and id in both the dirstate
            # and inventory, so just need to update the fields in the
            # dirstate from the one in the inventory.
            # TODO: update the record if anything significant has changed.
            # the minimal required trigger is if the execute bit or cached
            # kind has changed.
            if (current_old[1][0][3] != current_new[1].executable or
                current_old[1][0][0] != current_new_minikind):
                if tracing:
                    trace.mutter("Updating in-place change '%s'.",
                        new_path_utf8.decode('utf8'))
                self.update_minimal(current_old[0], current_new_minikind,
                    executable=current_new[1].executable,
                    path_utf8=new_path_utf8, fingerprint=fingerprint,
                    fullscan=True)
            # both sides are dealt with, move on
            current_old = advance(old_iterator)
            current_new = advance(new_iterator)
        elif (cmp_by_dirs(new_dirname, current_old[0][0]) < 0
              or (new_dirname == current_old[0][0]
                  and new_entry_key[1:] < current_old[0][1:])):
            # new comes before:
            # add an entry for this and advance new
            if tracing:
                trace.mutter("Inserting from new '%s'.",
                    new_path_utf8.decode('utf8'))
            self.update_minimal(new_entry_key, current_new_minikind,
                executable=current_new[1].executable,
                path_utf8=new_path_utf8, fingerprint=fingerprint,
                fullscan=True)
            current_new = advance(new_iterator)
        else:
            # we've advanced past the place where the old key would be,
            # without seeing it in the new list.  so it must be gone.
            if tracing:
                trace.mutter("Deleting from old '%s/%s'.",
                    current_old[0][0].decode('utf8'),
                    current_old[0][1].decode('utf8'))
            self._make_absent(current_old)
            current_old = advance(old_iterator)
    self._mark_modified()
    # Both caches are dropped here rather than kept in step with the
    # changes made above.
    self._id_index = None
    self._packed_stat_index = None
    if tracing:
        trace.mutter("set_state_from_inventory complete.")

2766

2767

def set_state_from_scratch(self, working_inv, parent_trees, parent_ghosts):
    """Throw away the stored state and rebuild it from the arguments.

    This is a hard reset of the data being worked with: the state is first
    replaced by a bare root, then populated from working_inv, and finally
    given its parent trees.

    :param working_inv: Inventory handed to set_state_from_inventory.
    :param parent_trees: Passed through to set_parent_trees.
    :param parent_ghosts: Passed through to set_parent_trees.
    """
    # Strictly a write lock is what we want, but nothing is written until
    # later, so for now holding any lock is enough.
    self._requires_lock()
    # set_state_from_inventory only works when a root is present, so begin
    # with a lone root directory row followed by an empty block for the
    # root's contents.
    root_key = ('', '', inventory.ROOT_ID)
    root_details = [('d', '', 0, False, DirState.NULLSTAT)]
    root_block = ('', [(root_key, root_details)])
    root_contents_block = ('', [])
    self._set_data([], [root_block, root_contents_block])
    self.set_state_from_inventory(working_inv)
    self.set_parent_trees(parent_trees, parent_ghosts)

2783

2784

def _make_absent(self, current_old):

2785

"""Mark current_old - an entry - as absent for tree 0.

2786

2787

:return: True if this was the last details entry for the entry key:

2788

that is, if the underlying block has had the entry removed, thus

2789

shrinking in length.

2790

"""

2791

# build up paths that this id will be left at after the change is made,

2792

# so we can update their cross references in tree 0

2793

all_remaining_keys = set()

2794

# Dont check the working tree, because it's going.

2795

for details in current_old[1][1:]:

2796

if details[0] not in 'ar': # absent, relocated

2797

all_remaining_keys.add(current_old[0])

2798

elif details[0] == 'r': # relocated

2799

# record the key for the real path.

2800

all_remaining_keys.add(tuple(osutils.split(details[1])) + (current_old[0][2],))

2801

# absent rows are not present at any path.

2802

last_reference = current_old[0] not in all_remaining_keys

2803

if last_reference:

2804

# the current row consists entire of the current item (being marked

2805

# absent), and relocated or absent entries for the other trees:

2806

# Remove it, its meaningless.

2807

block = self._find_block(current_old[0])

2808

entry_index, present = self._find_entry_index(current_old[0], block[1])

2809

if not present:

2810

raise AssertionError('could not find entry for %s' % (current_old,))

2811

block[1].pop(entry_index)

2812

# if we have an id_index in use, remove this key from it for this id.

2813

if self._id_index is not None:

2814

self._remove_from_id_index(self._id_index, current_old[0])

2815

# update all remaining keys for this id to record it as absent. The

2816

# existing details may either be the record we are marking as deleted

2817

# (if there were other trees with the id present at this path), or may

2818

# be relocations.

2819

for update_key in all_remaining_keys:

2820

update_block_index, present = \

2821

self._find_block_index_from_key(update_key)

2822

if not present:

2823

raise AssertionError('could not find block for %s' % (update_key,))

2824

update_entry_index, present = \

2825

self._find_entry_index(update_key, self._dirblocks[update_block_index][1])

2826

if not present:

2827

raise AssertionError('could not find entry for %s' % (update_key,))

2828

update_tree_details = self._dirblocks[update_block_index][1][update_entry_index][1]

2829

# it must not be absent at the moment

2830

if update_tree_details[0][0] == 'a': # absent

2831

raise AssertionError('bad row %r' % (update_tree_details,))

2832

update_tree_details[0] = DirState.NULL_PARENT_DETAILS

2833

self._mark_modified()

2834

return last_reference

2835

2836

def update_minimal(self, key, minikind, executable=False, fingerprint='',
                   packed_stat=None, size=0, path_utf8=None, fullscan=False):
    """Update an entry to the state in tree 0.

    This will either create a new entry at 'key' or update an existing one.
    It also makes sure that any other records which might mention this are
    updated as well.

    :param key: (dir, name, file_id) for the new entry
    :param minikind: The type for the entry ('f' == 'file', 'd' ==
        'directory'), etc.
    :param executable: Should the executable bit be set?
    :param fingerprint: Simple fingerprint for new entry: canonical-form
        sha1 for files, referenced revision id for subtrees, etc.
    :param packed_stat: Packed stat value for new entry.
    :param size: Size information for new entry
    :param path_utf8: key[0] + '/' + key[1], just passed in to avoid doing
        extra computation.
    :param fullscan: If True then a complete scan of the dirstate is being
        done and checking for duplicate rows should not be done. This
        should only be set by set_state_from_inventory and similar methods.
    :raises errors.InconsistentDelta: if fullscan is False and a different
        file id is already present in tree 0 at the same path.
    :raises AssertionError: if the dirblocks and the id index disagree, or
        if path_utf8 is needed to write a relocation but was not given.

    If packed_stat and fingerprint are not given, they're invalidated in
    the entry.
    """
    block = self._find_block(key)[1]
    if packed_stat is None:
        packed_stat = DirState.NULLSTAT
    # XXX: Some callers pass '' as the packed_stat, and it seems to be
    # sometimes present in the dirstate - this seems oddly inconsistent.
    # mbp 20071008
    entry_index, present = self._find_entry_index(key, block)
    new_details = (minikind, fingerprint, size, executable, packed_stat)
    id_index = self._get_id_index()
    if not present:
        # New record. Check there isn't an entry at this path already.
        if not fullscan:
            low_index, _ = self._find_entry_index(key[0:2] + ('',), block)
            while low_index < len(block):
                entry = block[low_index]
                if entry[0][0:2] == key[0:2]:
                    if entry[1][0][0] not in 'ar':
                        # This entry has the same path (but a different id)
                        # as the new entry we're adding, and is present in
                        # this tree.
                        raise errors.InconsistentDelta(
                            ("%s/%s" % key[0:2]).decode('utf8'), key[2],
                            "Attempt to add item at path already occupied by "
                            "id %r" % entry[0][2])
                    low_index += 1
                else:
                    break
        # new entry, synthesis cross reference here,
        existing_keys = id_index.get(key[2], ())
        if not existing_keys:
            # not currently in the state, simplest case
            new_entry = key, [new_details] + self._empty_parent_info()
        else:
            # present at one or more existing other paths.
            # grab one of them and use it to generate parent
            # relocation/absent entries.
            new_entry = key, [new_details]
            # existing_keys can be changed as we iterate.
            for other_key in tuple(existing_keys):
                # change the record at other to be a pointer to this new
                # record. The loop looks similar to the change to
                # relocations when updating an existing record but its not:
                # the test for existing kinds is different: this can be
                # factored out to a helper though.
                other_block_index, present = self._find_block_index_from_key(
                    other_key)
                if not present:
                    raise AssertionError('could not find block for %s' % (
                        other_key,))
                other_block = self._dirblocks[other_block_index][1]
                other_entry_index, present = self._find_entry_index(
                    other_key, other_block)
                if not present:
                    raise AssertionError(
                        'update_minimal: could not find other entry for %s'
                        % (other_key,))
                if path_utf8 is None:
                    raise AssertionError('no path')
                # Turn this other location into a reference to the new
                # location. This also updates the aliased iterator
                # (current_old in set_state_from_inventory) so that the old
                # entry, if not already examined, is skipped over by that
                # loop.
                other_entry = other_block[other_entry_index]
                other_entry[1][0] = ('r', path_utf8, 0, False, '')
                if self._maybe_remove_row(other_block, other_entry_index,
                                          id_index):
                    # If the row holding this was removed, we need to
                    # recompute where this entry goes
                    entry_index, _ = self._find_entry_index(key, block)

            # This loop:
            # adds a tuple to the new details for each column
            #  - either by copying an existing relocation pointer inside
            #    that column
            #  - or by creating a new pointer to the right row inside that
            #    column
            num_present_parents = self._num_present_parents()
            if num_present_parents:
                # TODO: This re-evaluates the existing_keys set, do we need
                #       to do that ourselves?
                other_key = list(existing_keys)[0]
            for lookup_index in xrange(1, num_present_parents + 1):
                # grab any one entry, use it to find the right path.
                # TODO: optimise this to reduce memory use in highly
                # fragmented situations by reusing the relocation
                # records.
                update_block_index, present = \
                    self._find_block_index_from_key(other_key)
                if not present:
                    raise AssertionError('could not find block for %s' % (other_key,))
                update_entry_index, present = \
                    self._find_entry_index(other_key, self._dirblocks[update_block_index][1])
                if not present:
                    raise AssertionError('update_minimal: could not find entry for %s' % (other_key,))
                update_details = self._dirblocks[update_block_index][1][update_entry_index][1][lookup_index]
                if update_details[0] in 'ar': # relocated, absent
                    # its a pointer or absent in lookup_index's tree, use
                    # it as is.
                    new_entry[1].append(update_details)
                else:
                    # we have the right key, make a pointer to it.
                    pointer_path = osutils.pathjoin(*other_key[0:2])
                    new_entry[1].append(('r', pointer_path, 0, False, ''))
        block.insert(entry_index, new_entry)
        self._add_to_id_index(id_index, key)
    else:
        # Does the new state matter?
        block[entry_index][1][0] = new_details
        # parents cannot be affected by what we do.
        # other occurrences of this id can be found
        # from the id index.
        # ---
        # tree index consistency: All other paths for this id in this tree
        # index must point to the correct path. We have to loop here because
        # we may have passed entries in the state with this file id already
        # that were absent - where parent entries are - and they need to be
        # converted to relocated.
        if path_utf8 is None:
            raise AssertionError('no path')
        existing_keys = id_index.get(key[2], ())
        if key not in existing_keys:
            raise AssertionError('We found the entry in the blocks, but'
                ' the key is not in the id_index.'
                ' key: %s, existing_keys: %s' % (key, existing_keys))
        for entry_key in existing_keys:
            # TODO:PROFILING: It might be faster to just update
            # rather than checking if we need to, and then overwrite
            # the one we are located at.
            if entry_key != key:
                # this file id is at a different path in one of the
                # other trees, so put absent pointers there
                # This is the vertical axis in the matrix, all pointing
                # to the real path.
                block_index, present = self._find_block_index_from_key(entry_key)
                if not present:
                    # The key must be interpolated into the message; passing
                    # it as a second exception argument leaves '%r' unfilled.
                    raise AssertionError('not present: %r' % (entry_key,))
                entry_index, present = self._find_entry_index(entry_key, self._dirblocks[block_index][1])
                if not present:
                    raise AssertionError('not present: %r' % (entry_key,))
                self._dirblocks[block_index][1][entry_index][1][0] = \
                    ('r', path_utf8, 0, False, '')
    # add a containing dirblock if needed.
    if new_details[0] == 'd':
        subdir_key = (osutils.pathjoin(*key[0:2]), '', '')
        block_index, present = self._find_block_index_from_key(subdir_key)
        if not present:
            self._dirblocks.insert(block_index, (subdir_key[0], []))

    self._mark_modified()

3009

3010

def _maybe_remove_row(self, block, index, id_index):

3011

"""Remove index if it is absent or relocated across the row.

3012

3013

id_index is updated accordingly.

3014

:return: True if we removed the row, False otherwise

3015

"""

3016

present_in_row = False

3017

entry = block[index]

3018

for column in entry[1]:

3019

if column[0] not in 'ar':

3020

present_in_row = True

3021

break

3022

if not present_in_row:

3023

block.pop(index)

3024

self._remove_from_id_index(id_index, entry[0])

3025

return True

3026

return False

3027

3028

def _validate(self):

3029

"""Check that invariants on the dirblock are correct.

3030

3031

This can be useful in debugging; it shouldn't be necessary in

3032

normal code.

3033

3034

This must be called with a lock held.

3035

"""

3036

# NOTE: This must always raise AssertionError not just assert,

3037

# otherwise it may not behave properly under python -O

3038

3039

# TODO: All entries must have some content that's not 'a' or 'r',

3040

# otherwise it could just be removed.

3041

3042

# TODO: All relocations must point directly to a real entry.

3043

3044

# TODO: No repeated keys.

3045

3046

# -- mbp 20070325

3047

from pprint import pformat

3048

self._read_dirblocks_if_needed()

3049

if len(self._dirblocks) > 0:

3050

if not self._dirblocks[0][0] == '':

3051

raise AssertionError(

3052

"dirblocks don't start with root block:\n" + \

3053

pformat(self._dirblocks))

3054

if len(self._dirblocks) > 1:

3055

if not self._dirblocks[1][0] == '':

3056

raise AssertionError(

3057

"dirblocks missing root directory:\n" + \

3058

pformat(self._dirblocks))

3059

# the dirblocks are sorted by their path components, name, and dir id

3060

dir_names = [d[0].split('/')

3061

for d in self._dirblocks[1:]]

3062

if dir_names != sorted(dir_names):

3063

raise AssertionError(

3064

"dir names are not in sorted order:\n" + \

3065

pformat(self._dirblocks) + \

3066

"\nkeys:\n" +

3067

pformat(dir_names))

3068

for dirblock in self._dirblocks:

3069

# within each dirblock, the entries are sorted by filename and

3070

# then by id.

3071

for entry in dirblock[1]:

3072

if dirblock[0] != entry[0][0]:

3073

raise AssertionError(

3074

"entry key for %r"

3075

"doesn't match directory name in\n%r" %

3076

(entry, pformat(dirblock)))

3077

if dirblock[1] != sorted(dirblock[1]):

3078

raise AssertionError(

3079

"dirblock for %r is not sorted:\n%s" % \

3080

(dirblock[0], pformat(dirblock)))

3081

3082

def check_valid_parent():

3083

"""Check that the current entry has a valid parent.

3084

3085

This makes sure that the parent has a record,

3086

and that the parent isn't marked as "absent" in the

3087

current tree. (It is invalid to have a non-absent file in an absent

3088

directory.)

3089

"""

3090

if entry[0][0:2] == ('', ''):

3091

# There should be no parent for the root row

3092

return

3093

parent_entry = self._get_entry(tree_index, path_utf8=entry[0][0])

3094

if parent_entry == (None, None):

3095

raise AssertionError(

3096

"no parent entry for: %s in tree %s"

3097

% (this_path, tree_index))

3098

if parent_entry[1][tree_index][0] != 'd':

3099

raise AssertionError(

3100

"Parent entry for %s is not marked as a valid"

3101

" directory. %s" % (this_path, parent_entry,))

3102

3103

# For each file id, for each tree: either

3104

# the file id is not present at all; all rows with that id in the

3105

# key have it marked as 'absent'

3106

# OR the file id is present under exactly one name; any other entries

3107

# that mention that id point to the correct name.

3108

3109

# We check this with a dict per tree pointing either to the present

3110

# name, or None if absent.

3111

tree_count = self._num_present_parents() + 1

3112

id_path_maps = [dict() for i in range(tree_count)]

3113

# Make sure that all renamed entries point to the correct location.

3114

for entry in self._iter_entries():

3115

file_id = entry[0][2]

3116

this_path = osutils.pathjoin(entry[0][0], entry[0][1])

3117

if len(entry[1]) != tree_count:

3118

raise AssertionError(

3119

"wrong number of entry details for row\n%s" \

3120

",\nexpected %d" % \

3121

(pformat(entry), tree_count))

3122

absent_positions = 0

3123

for tree_index, tree_state in enumerate(entry[1]):

3124

this_tree_map = id_path_maps[tree_index]

3125

minikind = tree_state[0]

3126

if minikind in 'ar':

3127

absent_positions += 1

3128

# have we seen this id before in this column?

3129

if file_id in this_tree_map:

3130

previous_path, previous_loc = this_tree_map[file_id]

3131

# any later mention of this file must be consistent with

3132

# what was said before

3133

if minikind == 'a':

3134

if previous_path is not None:

3135

raise AssertionError(

3136

"file %s is absent in row %r but also present " \

3137

"at %r"% \

3138

(file_id, entry, previous_path))

3139

elif minikind == 'r':

3140

target_location = tree_state[1]

3141

if previous_path != target_location:

3142

raise AssertionError(

3143

"file %s relocation in row %r but also at %r" \

3144

% (file_id, entry, previous_path))

3145

else:

3146

# a file, directory, etc - may have been previously

3147

# pointed to by a relocation, which must point here

3148

if previous_path != this_path:

3149

raise AssertionError(

3150

"entry %r inconsistent with previous path %r "

3151

"seen at %r" %

3152

(entry, previous_path, previous_loc))

3153

check_valid_parent()

3154

else:

3155

if minikind == 'a':

3156

# absent; should not occur anywhere else

3157

this_tree_map[file_id] = None, this_path

3158

elif minikind == 'r':

3159

# relocation, must occur at expected location

3160

this_tree_map[file_id] = tree_state[1], this_path

3161

else:

3162

this_tree_map[file_id] = this_path, this_path

3163

check_valid_parent()

3164

if absent_positions == tree_count:

3165

raise AssertionError(

3166

"entry %r has no data for any tree." % (entry,))

3167

if self._id_index is not None:

3168

for file_id, entry_keys in self._id_index.iteritems():

3169

for entry_key in entry_keys:

3170

if entry_key[2] != file_id:

3171

raise AssertionError(

3172

'file_id %r did not match entry key %s'

3173

% (file_id, entry_key))

3174

if len(entry_keys) != len(set(entry_keys)):

3175

raise AssertionError(

3176

'id_index contained non-unique data for %s'

3177

% (entry_keys,))

3178

3179

def _wipe_state(self):
    """Reset every in-memory attribute describing the dirstate.

    Both the header and dirblock states are set to
    DirState.NOT_IN_MEMORY; the parsed data and the derived caches are
    emptied.
    """
    not_loaded = DirState.NOT_IN_MEMORY
    self._header_state = not_loaded
    self._dirblock_state = not_loaded
    self._changes_aborted = False
    # parsed contents
    self._parents = []
    self._ghosts = []
    self._dirblocks = []
    # derived indexes and cached values
    self._id_index = None
    self._packed_stat_index = None
    self._end_of_header = None
    self._cutoff_time = None
    self._split_path_cache = {}

3192

3193

def lock_read(self):
    """Take a read lock on the dirstate file.

    Any state held in memory is wiped once the lock has been taken.

    :raises errors.LockContention: if this object already holds a lock
        token.
    """
    held_token = self._lock_token
    if held_token is not None:
        raise errors.LockContention(held_token)
    # TODO: jam 20070301 Rather than wiping completely, if the blocks are
    #       already in memory, we could read just the header and check for
    #       any modification. If not modified, we can just leave things
    #       alone
    new_token = lock.ReadLock(self._filename)
    self._lock_token = new_token
    self._lock_state = 'r'
    self._state_file = new_token.f
    self._wipe_state()

3205

3206

def lock_write(self):
    """Take a write lock on the dirstate file.

    Any state held in memory is wiped once the lock has been taken.

    :raises errors.LockContention: if this object already holds a lock
        token.
    """
    held_token = self._lock_token
    if held_token is not None:
        raise errors.LockContention(held_token)
    # TODO: jam 20070301 Rather than wiping completely, if the blocks are
    #       already in memory, we could read just the header and check for
    #       any modification. If not modified, we can just leave things
    #       alone
    new_token = lock.WriteLock(self._filename)
    self._lock_token = new_token
    self._lock_state = 'w'
    self._state_file = new_token.f
    self._wipe_state()

3218

3219

def unlock(self):
    """Release whichever lock is held on the dirstate.

    :raises errors.LockNotHeld: if no lock token is currently held.
    """
    held_token = self._lock_token
    if held_token is None:
        raise errors.LockNotHeld(self)
    # TODO: jam 20070301 Rather than wiping completely, if the blocks are
    #       already in memory, we could read just the header and check for
    #       any modification. If not modified, we can just leave things
    #       alone
    # The file handle and lock mode are forgotten before the token is
    # released; the token itself is only cleared after a successful unlock.
    self._state_file = None
    self._lock_state = None
    held_token.unlock()
    self._lock_token = None
    self._split_path_cache = {}

3232

3233

def _requires_lock(self):

3234

"""Check that a lock is currently held by someone on the dirstate."""

3235

if not self._lock_token:

3236

raise errors.ObjectNotLocked(self)

3237

3238

3239

def py_update_entry(state, entry, abspath, stat_value,
                    _stat_to_minikind=DirState._stat_to_minikind,
                    _pack_stat=pack_stat):
    """Update the entry based on what is actually on disk.

    This function only calculates the sha if it needs to - if the entry is
    uncachable, or clearly different to the first parent's entry, no sha
    is calculated, and None is returned.

    The tree 0 details in entry[1][0] are rewritten in place for files,
    directories and symlinks, and state._mark_modified([entry]) is called
    when the change is considered worth saving.

    :param state: The dirstate this entry is in.
    :param entry: This is the dirblock entry for the file in question.
    :param abspath: The path on disk for this file.
    :param stat_value: The stat value done on the path.
    :param _stat_to_minikind: Mapping from file-type bits to minikind;
        bound as a default argument, not intended to be passed by callers.
    :param _pack_stat: Function turning stat_value into a packed stat;
        bound as a default argument, not intended to be passed by callers.
    :return: None, or The sha1 hexdigest of the file (40 bytes) or link
        target of a symlink.
    """
    try:
        # 0170000 masks out the file-type bits of st_mode (S_IFMT).
        minikind = _stat_to_minikind[stat_value.st_mode & 0170000]
    except KeyError:
        # Unhandled kind
        return None
    packed_stat = _pack_stat(stat_value)
    (saved_minikind, saved_link_or_sha1, saved_file_size,
     saved_executable, saved_packed_stat) = entry[1][0]

    # A directory on disk whose saved kind is 't' is still treated as 't'.
    if minikind == 'd' and saved_minikind == 't':
        minikind = 't'
    if (minikind == saved_minikind
        and packed_stat == saved_packed_stat):
        # The stat hasn't changed since we saved, so we can re-use the
        # saved sha hash.
        if minikind == 'd':
            return None

        # size should also be in packed_stat
        if saved_file_size == stat_value.st_size:
            return saved_link_or_sha1

    # If we have gotten this far, that means that we need to actually
    # process this entry.
    link_or_sha1 = None
    worth_saving = True
    if minikind == 'f':
        executable = state._is_executable(stat_value.st_mode,
                                          saved_executable)
        if state._cutoff_time is None:
            state._sha_cutoff_time()
        if (stat_value.st_mtime < state._cutoff_time
            and stat_value.st_ctime < state._cutoff_time
            and len(entry[1]) > 1
            and entry[1][1][0] != 'a'):
            # Could check for size changes for further optimised
            # avoidance of sha1's. However the most prominent case of
            # over-shaing is during initial add, which this catches.
            # Besides, if content filtering happens, size and sha
            # are calculated at the same time, so checking just the size
            # gains nothing w.r.t. performance.
            link_or_sha1 = state._sha1_file(abspath)
            entry[1][0] = ('f', link_or_sha1, stat_value.st_size,
                           executable, packed_stat)
        else:
            # No sha is computed: store an empty fingerprint and NULLSTAT
            # so the record is not treated as a valid cache later.
            entry[1][0] = ('f', '', stat_value.st_size,
                           executable, DirState.NULLSTAT)
            worth_saving = False
    elif minikind == 'd':
        link_or_sha1 = None
        entry[1][0] = ('d', '', 0, False, packed_stat)
        if saved_minikind != 'd':
            # This changed from something into a directory. Make sure we
            # have a directory block for it. This doesn't happen very
            # often, so this doesn't have to be super fast.
            block_index, entry_index, dir_present, file_present = \
                state._get_block_entry_index(entry[0][0], entry[0][1], 0)
            state._ensure_block(block_index, entry_index,
                                osutils.pathjoin(entry[0][0], entry[0][1]))
        else:
            worth_saving = False
    elif minikind == 'l':
        if saved_minikind == 'l':
            worth_saving = False
        link_or_sha1 = state._read_link(abspath, saved_link_or_sha1)
        if state._cutoff_time is None:
            state._sha_cutoff_time()
        if (stat_value.st_mtime < state._cutoff_time
            and stat_value.st_ctime < state._cutoff_time):
            entry[1][0] = ('l', link_or_sha1, stat_value.st_size,
                           False, packed_stat)
        else:
            entry[1][0] = ('l', '', stat_value.st_size,
                           False, DirState.NULLSTAT)
    if worth_saving:
        state._mark_modified([entry])
    return link_or_sha1

3332

3333

3334

class ProcessEntryPython(object):

3335

3336

__slots__ = ["old_dirname_to_file_id", "new_dirname_to_file_id",

3337

"last_source_parent", "last_target_parent", "include_unchanged",

3338

"partial", "use_filesystem_for_exec", "utf8_decode",

3339

"searched_specific_files", "search_specific_files",

3340

"searched_exact_paths", "search_specific_file_parents", "seen_ids",

3341

"state", "source_index", "target_index", "want_unversioned", "tree"]

3342

3343

def __init__(self, include_unchanged, use_filesystem_for_exec,
             search_specific_files, state, source_index, target_index,
             want_unversioned, tree):
    """Store the comparison settings and create empty bookkeeping.

    :raises errors.BzrError: if target_index is not 0.
    """
    # Settings supplied by the caller.
    self.include_unchanged = include_unchanged
    self.use_filesystem_for_exec = use_filesystem_for_exec
    self.search_specific_files = search_specific_files
    # Anything other than exactly {''} counts as a partial iter_changes.
    self.partial = search_specific_files != set([''])
    self.utf8_decode = cache_utf8._utf8_decode

    # Bookkeeping that starts out empty.
    self.old_dirname_to_file_id = {}
    self.new_dirname_to_file_id = {}
    # Lists, so that the values can be read and changed from a nested
    # scope.
    # NOTE(review): these start with two slots; confirm the intended
    # layout against the code that fills them in.
    self.last_source_parent = [None, None]
    self.last_target_parent = [None, None]
    # for all search_indexs in each path at or under each element of
    # search_specific_files, if the detail is relocated: add the id, and
    # add the relocated path as one to search if its not searched already.
    # If the detail is not relocated, add the id.
    self.searched_specific_files = set()
    # Exact paths searched without expanding downwards.
    self.searched_exact_paths = set()
    # The parents, up to the root, of the paths being searched.  These
    # specific items are returned after all the normal paths.
    self.search_specific_file_parents = set()
    # The ids already sent out in the delta.
    self.seen_ids = set()

    self.state = state
    self.source_index = source_index
    self.target_index = target_index
    if target_index != 0:
        # A lot of code in here depends on target_index == 0
        raise errors.BzrError('unsupported target index')
    self.want_unversioned = want_unversioned
    self.tree = tree

3379

3380

def _process_entry(self, entry, path_info, pathjoin=osutils.pathjoin):
    """Compare an entry and real disk to generate delta information.

    The (source minikind, target minikind) pair of the entry selects one of
    five cases: content claimed on both sides, added, removed, relocated
    away in the target, or present on neither side.

    :param entry: a dirstate entry; entry[0] is (dirname, basename, file_id)
        and entry[1] is indexed by tree index to get the per-tree details.
    :param path_info: top_relpath, basename, kind, lstat, abspath for
        the path of entry. If None, then the path is considered absent in
        the target (Perhaps we should pass in a concrete entry for this ?)
        Basename is returned as a utf8 string because we expect this
        tuple will be ignored, and don't want to take the time to
        decode.
    :param pathjoin: function used to join a dirname and a basename.
    :return: (iter_changes_result, changed). If the entry has not been
        handled then changed is None. Otherwise it is False if no content
        or metadata changes have occurred, and True if any content or
        metadata change has occurred. If self.include_unchanged is True then
        if changed is not None, iter_changes_result will always be a result
        tuple. Otherwise, iter_changes_result is None unless changed is
        True.

        A result tuple is (file_id, (old_path, new_path), content_change,
        (source flag, target flag), (source_parent_id, target_parent_id),
        (old_basename, new_basename), (source_kind, target_kind),
        (source_exec, target_exec)); paths and basenames are decoded with
        self.utf8_decode.
    :raises errors.CorruptDirstate: if the entry claims to be renamed from
        a path that has no entry in the source tree.
    :raises errors.BadFileKindError: if the kind found on disk is not one
        of directory, file, symlink or tree-reference.
    :raises AssertionError: if the target parent cannot be found, or the
        minikind combination is not recognised.
    """
    if self.source_index is None:
        source_details = DirState.NULL_PARENT_DETAILS
    else:
        source_details = entry[1][self.source_index]
    target_details = entry[1][self.target_index]
    target_minikind = target_details[0]
    if path_info is not None and target_minikind in 'fdlt':
        if not (self.target_index == 0):
            raise AssertionError()
        # Refresh the target record from the stat result we already have.
        link_or_sha1 = update_entry(self.state, entry,
            abspath=path_info[4], stat_value=path_info[3])
        # The entry may have been modified by update_entry
        target_details = entry[1][self.target_index]
        target_minikind = target_details[0]
    else:
        link_or_sha1 = None
    file_id = entry[0][2]
    source_minikind = source_details[0]
    if source_minikind in 'fdltr' and target_minikind in 'fdlt':
        # claimed content in both: diff
        #   r    | fdlt   |      | add source to search, add id path move and perform
        #        |        |      | diff check on source-target
        #   r    | fdlt   |  a   | dangling file that was present in the basis.
        #        |        |      | ???
        if source_minikind in 'r':
            # add the source to the search path to find any children it
            # has.  TODO ? : only add if it is a container ?
            if not osutils.is_inside_any(self.searched_specific_files,
                                         source_details[1]):
                self.search_specific_files.add(source_details[1])
            # generate the old path; this is needed for stating later
            # as well.
            old_path = source_details[1]
            old_dirname, old_basename = os.path.split(old_path)
            path = pathjoin(entry[0][0], entry[0][1])
            old_entry = self.state._get_entry(self.source_index,
                                              path_utf8=old_path)
            # update the source details variable to be the real
            # location.
            if old_entry == (None, None):
                raise errors.CorruptDirstate(self.state._filename,
                    "entry '%s/%s' is considered renamed from %r"
                    " but source does not exist\n"
                    "entry: %s" % (entry[0][0], entry[0][1], old_path, entry))
            source_details = old_entry[1][self.source_index]
            source_minikind = source_details[0]
        else:
            old_dirname = entry[0][0]
            old_basename = entry[0][1]
            # Not relocated: the paths are only computed if they turn out
            # to be needed further down.
            old_path = path = None
        if path_info is None:
            # the file is missing on disk, show as removed.
            content_change = True
            target_kind = None
            target_exec = False
        else:
            # source and target are both versioned and disk file is present.
            target_kind = path_info[2]
            if target_kind == 'directory':
                if path is None:
                    old_path = path = pathjoin(old_dirname, old_basename)
                # Remember the directory so that its children can find
                # their target parent id without a _get_entry lookup.
                self.new_dirname_to_file_id[path] = file_id
                if source_minikind != 'd':
                    content_change = True
                else:
                    # directories have no fingerprint
                    content_change = False
                target_exec = False
            elif target_kind == 'file':
                if source_minikind != 'f':
                    content_change = True
                else:
                    # Check the sha. We can't just rely on the size as
                    # content filtering may mean different sizes actually
                    # map to the same content
                    if link_or_sha1 is None:
                        # Stat cache miss:
                        statvalue, link_or_sha1 = \
                            self.state._sha1_provider.stat_and_sha1(
                            path_info[4])
                        self.state._observed_sha1(entry, link_or_sha1,
                            statvalue)
                    content_change = (link_or_sha1 != source_details[1])
                # Target details is updated at update_entry time
                if self.use_filesystem_for_exec:
                    # We don't need S_ISREG here, because we are sure
                    # we are dealing with a file.
                    target_exec = bool(stat.S_IEXEC & path_info[3].st_mode)
                else:
                    target_exec = target_details[3]
            elif target_kind == 'symlink':
                if source_minikind != 'l':
                    content_change = True
                else:
                    content_change = (link_or_sha1 != source_details[1])
                target_exec = False
            elif target_kind == 'tree-reference':
                if source_minikind != 't':
                    content_change = True
                else:
                    content_change = False
                target_exec = False
            else:
                if path is None:
                    path = pathjoin(old_dirname, old_basename)
                raise errors.BadFileKindError(path, path_info[2])
        if source_minikind == 'd':
            if path is None:
                old_path = path = pathjoin(old_dirname, old_basename)
            # Same caching as above, for the source side.
            self.old_dirname_to_file_id[old_path] = file_id
        # source parent id: the file id recorded for old_dirname in the
        # source tree (one-slot cache first, then the dict, then the state).
        if old_basename and old_dirname == self.last_source_parent[0]:
            source_parent_id = self.last_source_parent[1]
        else:
            try:
                source_parent_id = self.old_dirname_to_file_id[old_dirname]
            except KeyError:
                source_parent_entry = self.state._get_entry(self.source_index,
                                                       path_utf8=old_dirname)
                source_parent_id = source_parent_entry[0][2]
            if source_parent_id == entry[0][2]:
                # This is the root, so the parent is None
                source_parent_id = None
            else:
                self.last_source_parent[0] = old_dirname
                self.last_source_parent[1] = source_parent_id
        # target parent id: the same lookup chain against the target tree.
        new_dirname = entry[0][0]
        if entry[0][1] and new_dirname == self.last_target_parent[0]:
            target_parent_id = self.last_target_parent[1]
        else:
            try:
                target_parent_id = self.new_dirname_to_file_id[new_dirname]
            except KeyError:
                # TODO: We don't always need to do the lookup, because the
                #       parent entry will be the same as the source entry.
                target_parent_entry = self.state._get_entry(self.target_index,
                                                       path_utf8=new_dirname)
                if target_parent_entry == (None, None):
                    raise AssertionError(
                        "Could not find target parent in wt: %s\nparent of: %s"
                        % (new_dirname, entry))
                target_parent_id = target_parent_entry[0][2]
            if target_parent_id == entry[0][2]:
                # This is the root, so the parent is None
                target_parent_id = None
            else:
                self.last_target_parent[0] = new_dirname
                self.last_target_parent[1] = target_parent_id

        source_exec = source_details[3]
        # Any difference in content, parent, name or exec bit is a change.
        changed = (content_change
            or source_parent_id != target_parent_id
            or old_basename != entry[0][1]
            or source_exec != target_exec
            )
        if not changed and not self.include_unchanged:
            return None, False
        else:
            if old_path is None:
                old_path = path = pathjoin(old_dirname, old_basename)
                old_path_u = self.utf8_decode(old_path)[0]
                path_u = old_path_u
            else:
                old_path_u = self.utf8_decode(old_path)[0]
                if old_path == path:
                    # Avoid decoding the same path twice.
                    path_u = old_path_u
                else:
                    path_u = self.utf8_decode(path)[0]
            source_kind = DirState._minikind_to_kind[source_minikind]
            return (entry[0][2],
                   (old_path_u, path_u),
                   content_change,
                   (True, True),
                   (source_parent_id, target_parent_id),
                   (self.utf8_decode(old_basename)[0], self.utf8_decode(entry[0][1])[0]),
                   (source_kind, target_kind),
                   (source_exec, target_exec)), changed
    elif source_minikind in 'a' and target_minikind in 'fdlt':
        # looks like a new file
        path = pathjoin(entry[0][0], entry[0][1])
        # parent id is the entry for the path in the target tree
        # TODO: these are the same for an entire directory: cache em.
        parent_id = self.state._get_entry(self.target_index,
                                     path_utf8=entry[0][0])[0][2]
        if parent_id == entry[0][2]:
            parent_id = None
        if path_info is not None:
            # Present on disk:
            if self.use_filesystem_for_exec:
                # We need S_ISREG here, because we aren't sure if this
                # is a file or not.
                target_exec = bool(
                    stat.S_ISREG(path_info[3].st_mode)
                    and stat.S_IEXEC & path_info[3].st_mode)
            else:
                target_exec = target_details[3]
            return (entry[0][2],
                   (None, self.utf8_decode(path)[0]),
                   True,
                   (False, True),
                   (None, parent_id),
                   (None, self.utf8_decode(entry[0][1])[0]),
                   (None, path_info[2]),
                   (None, target_exec)), True
        else:
            # Its a missing file, report it as such.
            return (entry[0][2],
                   (None, self.utf8_decode(path)[0]),
                   False,
                   (False, True),
                   (None, parent_id),
                   (None, self.utf8_decode(entry[0][1])[0]),
                   (None, None),
                   (None, False)), True
    elif source_minikind in 'fdlt' and target_minikind in 'a':
        # unversioned, possibly, or possibly not deleted: we dont care.
        # if its still on disk, *and* theres no other entry at this
        # path [we dont know this in this routine at the moment -
        # perhaps we should change this - then it would be an unknown.
        old_path = pathjoin(entry[0][0], entry[0][1])
        # parent id is the entry for the containing directory in the
        # source tree
        parent_id = self.state._get_entry(self.source_index, path_utf8=entry[0][0])[0][2]
        if parent_id == entry[0][2]:
            parent_id = None
        return (entry[0][2],
               (self.utf8_decode(old_path)[0], None),
               True,
               (True, False),
               (parent_id, None),
               (self.utf8_decode(entry[0][1])[0], None),
               (DirState._minikind_to_kind[source_minikind], None),
               (source_details[3], None)), True
    elif source_minikind in 'fdlt' and target_minikind in 'r':
        # a rename; could be a true rename, or a rename inherited from
        # a renamed parent. TODO: handle this efficiently. Its not
        # common case to rename dirs though, so a correct but slow
        # implementation will do.
        if not osutils.is_inside_any(self.searched_specific_files, target_details[1]):
            self.search_specific_files.add(target_details[1])
    elif source_minikind in 'ra' and target_minikind in 'ra':
        # neither of the selected trees contain this file,
        # so skip over it. This is not currently directly tested, but
        # is indirectly via test_too_much.TestCommands.test_conflicts.
        pass
    else:
        raise AssertionError("don't know how to compare "
            "source_minikind=%r, target_minikind=%r"
            % (source_minikind, target_minikind))
    # Reached by the two branches above that report nothing for this entry.
    return None, None

3647

3648

def __iter__(self):
    """Return this object itself as the iterator."""
    return self

3650

3651

def _gather_result_for_consistency(self, result):
    """Record a result about to be yielded so the output stays consistent.

    During a partial iter_changes the file id of the result is remembered
    and every parent directory of its new path is queued, so that those
    parents can be examined later.

    :param result: A result tuple.
    """
    if not (self.partial and result[0]):
        # Full-tree runs and results without a file id need no tracking.
        return
    self.seen_ids.add(result[0])
    target_path = result[1][1]
    if target_path:
        # Neither the root nor a delete: queue every parent of the path.
        pending_parents = self.search_specific_file_parents
        utf8_target_path = target_path.encode('utf8')
        pending_parents.update(osutils.parent_directories(utf8_target_path))
        # parent_directories does not provide the root directory, so add
        # it explicitly.
        pending_parents.add('')

3669

3670

def iter_changes(self):

3671

"""Iterate over the changes."""

3672

utf8_decode = cache_utf8._utf8_decode

3673

_cmp_by_dirs = cmp_by_dirs

3674

_process_entry = self._process_entry

3675

search_specific_files = self.search_specific_files

3676

searched_specific_files = self.searched_specific_files

3677

splitpath = osutils.splitpath

3678

# sketch:

3679

# compare source_index and target_index at or under each element of search_specific_files.

3680

# follow the following comparison table. Note that we only want to do diff operations when

3681

# the target is fdl because thats when the walkdirs logic will have exposed the pathinfo

3682

# for the target.

3683

# cases:

3684

3685

# Source | Target | disk | action

3686

# r | fdlt | | add source to search, add id path move and perform

3687

# | | | diff check on source-target

3688

# r | fdlt | a | dangling file that was present in the basis.

3689

# | | | ???

3690

# r | a | | add source to search

3691

# r | a | a |

3692

# r | r | | this path is present in a non-examined tree, skip.

3693

# r | r | a | this path is present in a non-examined tree, skip.

3694

# a | fdlt | | add new id

3695

# a | fdlt | a | dangling locally added file, skip

3696

# a | a | | not present in either tree, skip

3697

# a | a | a | not present in any tree, skip

3698

# a | r | | not present in either tree at this path, skip as it

3699

# | | | may not be selected by the users list of paths.

3700

# a | r | a | not present in either tree at this path, skip as it

3701

# | | | may not be selected by the users list of paths.

3702

# fdlt | fdlt | | content in both: diff them

3703

# fdlt | fdlt | a | deleted locally, but not unversioned - show as deleted ?

3704

# fdlt | a | | unversioned: output deleted id for now

3705

# fdlt | a | a | unversioned and deleted: output deleted id

3706

# fdlt | r | | relocated in this tree, so add target to search.

3707

# | | | Dont diff, we will see an r,fd; pair when we reach

3708

# | | | this id at the other path.

3709

# fdlt | r | a | relocated in this tree, so add target to search.

3710

# | | | Dont diff, we will see an r,fd; pair when we reach

3711

# | | | this id at the other path.

3712

3713

# TODO: jam 20070516 - Avoid the _get_entry lookup overhead by

3714

# keeping a cache of directories that we have seen.

3715

3716

while search_specific_files:

3717

# TODO: the pending list should be lexically sorted? the

3718

# interface doesn't require it.

3719

current_root = search_specific_files.pop()

3720

current_root_unicode = current_root.decode('utf8')

3721

searched_specific_files.add(current_root)

3722

# process the entries for this containing directory: the rest will be

3723

# found by their parents recursively.

3724

root_entries = self.state._entries_for_path(current_root)

3725

root_abspath = self.tree.abspath(current_root_unicode)

3726

try:

3727

root_stat = os.lstat(root_abspath)

3728

except OSError, e:

3729

if e.errno == errno.ENOENT:

3730

# the path does not exist: let _process_entry know that.

3731

root_dir_info = None

3732

else:

3733

# some other random error: hand it up.

3734

raise

3735

else:

3736

root_dir_info = ('', current_root,

3737

osutils.file_kind_from_stat_mode(root_stat.st_mode), root_stat,

3738

root_abspath)

3739

if root_dir_info[2] == 'directory':

3740

if self.tree._directory_is_tree_reference(

3741

current_root.decode('utf8')):

3742

root_dir_info = root_dir_info[:2] + \

3743

('tree-reference',) + root_dir_info[3:]

3744

3745

if not root_entries and not root_dir_info:

3746

# this specified path is not present at all, skip it.

3747

continue

3748

path_handled = False

3749

for entry in root_entries:

3750

result, changed = _process_entry(entry, root_dir_info)

3751

if changed is not None:

3752

path_handled = True

3753

if changed:

3754

self._gather_result_for_consistency(result)

3755

if changed or self.include_unchanged:

3756

yield result

3757

if self.want_unversioned and not path_handled and root_dir_info:

3758

new_executable = bool(

3759

stat.S_ISREG(root_dir_info[3].st_mode)

3760

and stat.S_IEXEC & root_dir_info[3].st_mode)

3761

yield (None,

3762

(None, current_root_unicode),

3763

True,

3764

(False, False),

3765

(None, None),

3766

(None, splitpath(current_root_unicode)[-1]),

3767

(None, root_dir_info[2]),

3768

(None, new_executable)

3769

)

3770

initial_key = (current_root, '', '')

3771

block_index, _ = self.state._find_block_index_from_key(initial_key)

3772

if block_index == 0:

3773

# we have processed the total root already, but because the

3774

# initial key matched it we should skip it here.

3775

block_index +=1

3776

if root_dir_info and root_dir_info[2] == 'tree-reference':

3777

current_dir_info = None

3778

else:

3779

dir_iterator = osutils._walkdirs_utf8(root_abspath, prefix=current_root)

3780

try:

3781

current_dir_info = dir_iterator.next()

3782

except OSError, e:

3783

# on win32, python2.4 has e.errno == ERROR_DIRECTORY, but

3784

# python 2.5 has e.errno == EINVAL,

3785

# and e.winerror == ERROR_DIRECTORY

3786

e_winerror = getattr(e, 'winerror', None)

3787

win_errors = (ERROR_DIRECTORY, ERROR_PATH_NOT_FOUND)

3788

# there may be directories in the inventory even though

3789

# this path is not a file on disk: so mark it as end of

3790

# iterator

3791

if e.errno in (errno.ENOENT, errno.ENOTDIR, errno.EINVAL):

3792

current_dir_info = None

3793

elif (sys.platform == 'win32'

3794

and (e.errno in win_errors

3795

or e_winerror in win_errors)):

3796

current_dir_info = None

3797

else:

3798

raise

3799

else:

3800

if current_dir_info[0][0] == '':

3801

# remove .bzr from iteration

3802

bzr_index = bisect.bisect_left(current_dir_info[1], ('.bzr',))

3803

if current_dir_info[1][bzr_index][0] != '.bzr':

3804

raise AssertionError()

3805

del current_dir_info[1][bzr_index]

3806

# walk until both the directory listing and the versioned metadata

3807

# are exhausted.

3808

if (block_index < len(self.state._dirblocks) and

3809

osutils.is_inside(current_root, self.state._dirblocks[block_index][0])):

3810

current_block = self.state._dirblocks[block_index]

3811

else:

3812

current_block = None

3813

while (current_dir_info is not None or

3814

current_block is not None):

3815

if (current_dir_info and current_block

3816

and current_dir_info[0][0] != current_block[0]):

3817

if _cmp_by_dirs(current_dir_info[0][0], current_block[0]) < 0:

3818

# filesystem data refers to paths not covered by the dirblock.

3819

# this has two possibilities:

3820

# A) it is versioned but empty, so there is no block for it

3821

# B) it is not versioned.

3822

3823

# if (A) then we need to recurse into it to check for

3824

# new unknown files or directories.

3825

# if (B) then we should ignore it, because we don't

3826

# recurse into unknown directories.

3827

path_index = 0

3828

while path_index < len(current_dir_info[1]):

3829

current_path_info = current_dir_info[1][path_index]

3830

if self.want_unversioned:

3831

if current_path_info[2] == 'directory':

3832

if self.tree._directory_is_tree_reference(

3833

current_path_info[0].decode('utf8')):

3834

current_path_info = current_path_info[:2] + \

3835

('tree-reference',) + current_path_info[3:]

3836

new_executable = bool(

3837

stat.S_ISREG(current_path_info[3].st_mode)

3838

and stat.S_IEXEC & current_path_info[3].st_mode)

3839

yield (None,

3840

(None, utf8_decode(current_path_info[0])[0]),

3841

True,

3842

(False, False),

3843

(None, None),

3844

(None, utf8_decode(current_path_info[1])[0]),

3845

(None, current_path_info[2]),

3846

(None, new_executable))

3847

# dont descend into this unversioned path if it is

3848

# a dir

3849

if current_path_info[2] in ('directory',

3850

'tree-reference'):

3851

del current_dir_info[1][path_index]

3852

path_index -= 1

3853

path_index += 1

3854

3855

# This dir info has been handled, go to the next

3856

try:

3857

current_dir_info = dir_iterator.next()

3858

except StopIteration:

3859

current_dir_info = None

3860

else:

3861

# We have a dirblock entry for this location, but there

3862

# is no filesystem path for this. This is most likely

3863

# because a directory was removed from the disk.

3864

# We don't have to report the missing directory,

3865

# because that should have already been handled, but we

3866

# need to handle all of the files that are contained

3867

# within.

3868

for current_entry in current_block[1]:

3869

# entry referring to file not present on disk.

3870

# advance the entry only, after processing.

3871

result, changed = _process_entry(current_entry, None)

3872

if changed is not None:

3873

if changed:

3874

self._gather_result_for_consistency(result)

3875

if changed or self.include_unchanged:

3876

yield result

3877

block_index +=1

3878

if (block_index < len(self.state._dirblocks) and

3879

osutils.is_inside(current_root,

3880

self.state._dirblocks[block_index][0])):

3881

current_block = self.state._dirblocks[block_index]

3882

else:

3883

current_block = None

3884

continue

3885

entry_index = 0

3886

if current_block and entry_index < len(current_block[1]):

3887

current_entry = current_block[1][entry_index]

3888

else:

3889

current_entry = None

3890

advance_entry = True

3891

path_index = 0

3892

if current_dir_info and path_index < len(current_dir_info[1]):

3893

current_path_info = current_dir_info[1][path_index]

3894

if current_path_info[2] == 'directory':

3895

if self.tree._directory_is_tree_reference(

3896

current_path_info[0].decode('utf8')):

3897

current_path_info = current_path_info[:2] + \

3898

('tree-reference',) + current_path_info[3:]

3899

else:

3900

current_path_info = None

3901

advance_path = True

3902

path_handled = False

3903

while (current_entry is not None or

3904

current_path_info is not None):

3905

if current_entry is None:

3906

# the check for path_handled when the path is advanced

3907

# will yield this path if needed.

3908

pass

3909

elif current_path_info is None:

3910

# no path is fine: the per entry code will handle it.

3911

result, changed = _process_entry(current_entry, current_path_info)

3912

if changed is not None:

3913

if changed:

3914

self._gather_result_for_consistency(result)

3915

if changed or self.include_unchanged:

3916

yield result

3917

elif (current_entry[0][1] != current_path_info[1]

3918

or current_entry[1][self.target_index][0] in 'ar'):

3919

# The current path on disk doesn't match the dirblock

3920

# record. Either the dirblock is marked as absent, or

3921

# the file on disk is not present at all in the

3922

# dirblock. Either way, report about the dirblock

3923

# entry, and let other code handle the filesystem one.

3924

3925

# Compare the basename for these files to determine

3926

# which comes first

3927

if current_path_info[1] < current_entry[0][1]:

3928

# extra file on disk: pass for now, but only

3929

# increment the path, not the entry

3930

advance_entry = False

3931

else:

3932

# entry referring to file not present on disk.

3933

# advance the entry only, after processing.

3934

result, changed = _process_entry(current_entry, None)

3935

if changed is not None:

3936

if changed:

3937

self._gather_result_for_consistency(result)

3938

if changed or self.include_unchanged:

3939

yield result

3940

advance_path = False

3941

else:

3942

result, changed = _process_entry(current_entry, current_path_info)

3943

if changed is not None:

3944

path_handled = True

3945

if changed:

3946

self._gather_result_for_consistency(result)

3947

if changed or self.include_unchanged:

3948

yield result

3949

if advance_entry and current_entry is not None:

3950

entry_index += 1

3951

if entry_index < len(current_block[1]):

3952

current_entry = current_block[1][entry_index]

3953

else:

3954

current_entry = None

3955

else:

3956

advance_entry = True # reset the advance flaga

3957

if advance_path and current_path_info is not None:

3958

if not path_handled:

3959

# unversioned in all regards

3960

if self.want_unversioned:

3961

new_executable = bool(

3962

stat.S_ISREG(current_path_info[3].st_mode)

3963

and stat.S_IEXEC & current_path_info[3].st_mode)

3964

try:

3965

relpath_unicode = utf8_decode(current_path_info[0])[0]

3966

except UnicodeDecodeError:

3967

raise errors.BadFilenameEncoding(

3968

current_path_info[0], osutils._fs_enc)

3969

yield (None,

3970

(None, relpath_unicode),

3971

True,

3972

(False, False),

3973

(None, None),

3974

(None, utf8_decode(current_path_info[1])[0]),

3975

(None, current_path_info[2]),

3976

(None, new_executable))

3977

# dont descend into this unversioned path if it is

3978

# a dir

3979

if current_path_info[2] in ('directory'):

3980

del current_dir_info[1][path_index]

3981

path_index -= 1

3982

# dont descend the disk iterator into any tree

3983

# paths.

3984

if current_path_info[2] == 'tree-reference':

3985

del current_dir_info[1][path_index]

3986

path_index -= 1

3987

path_index += 1

3988

if path_index < len(current_dir_info[1]):

3989

current_path_info = current_dir_info[1][path_index]

3990

if current_path_info[2] == 'directory':

3991

if self.tree._directory_is_tree_reference(

3992

current_path_info[0].decode('utf8')):

3993

current_path_info = current_path_info[:2] + \

3994

('tree-reference',) + current_path_info[3:]

3995

else:

3996

current_path_info = None

3997

path_handled = False

3998

else:

3999

advance_path = True # reset the advance flagg.

4000

if current_block is not None:

4001

block_index += 1

4002

if (block_index < len(self.state._dirblocks) and

4003

osutils.is_inside(current_root, self.state._dirblocks[block_index][0])):

4004

current_block = self.state._dirblocks[block_index]

4005

else:

4006

current_block = None

4007

if current_dir_info is not None:

4008

try:

4009

current_dir_info = dir_iterator.next()

4010

except StopIteration:

4011

current_dir_info = None

4012

for result in self._iter_specific_file_parents():

4013

yield result

4014

4015

def _iter_specific_file_parents(self):
    """Iter over the specific file parents.

    Drains self.search_specific_file_parents. Each path that has not been
    examined yet is compared with self._process_entry and the result is
    yielded under the same changed / include_unchanged rule used by
    iter_changes. If a path stopped being a directory, the children it had
    in the source tree are queued too.

    :raises AssertionError: if a queued path has no entry present in either
        tree, or if _process_entry does not handle a selected entry.
    """
    while self.search_specific_file_parents:
        # Process the parent directories for the paths we were iterating.
        # Even in extremely large trees this should be modest, so currently
        # no attempt is made to optimise.
        path_utf8 = self.search_specific_file_parents.pop()
        if osutils.is_inside_any(self.searched_specific_files, path_utf8):
            # We've examined this path.
            continue
        if path_utf8 in self.searched_exact_paths:
            # We've examined this path.
            continue
        path_entries = self.state._entries_for_path(path_utf8)
        # We need either one or two entries. If the path in
        # self.target_index has moved (so the entry in source_index is in
        # 'ar') then we need to also look for the entry for this path in
        # self.source_index, to output the appropriate delete-or-rename.
        selected_entries = []
        found_item = False
        for candidate_entry in path_entries:
            # Find entries present in target at this path:
            if candidate_entry[1][self.target_index][0] not in 'ar':
                found_item = True
                selected_entries.append(candidate_entry)
            # Find entries present in source at this path:
            elif (self.source_index is not None and
                candidate_entry[1][self.source_index][0] not in 'ar'):
                found_item = True
                if candidate_entry[1][self.target_index][0] == 'a':
                    # Deleted, emit it here.
                    selected_entries.append(candidate_entry)
                else:
                    # renamed, emit it when we process the directory it
                    # ended up at.
                    self.search_specific_file_parents.add(
                        candidate_entry[1][self.target_index][1])
        if not found_item:
            raise AssertionError(
                "Missing entry for specific path parent %r, %r" % (
                path_utf8, path_entries))
        path_info = self._path_info(path_utf8, path_utf8.decode('utf8'))
        for entry in selected_entries:
            if entry[0][2] in self.seen_ids:
                # Already reported by an earlier result.
                continue
            result, changed = self._process_entry(entry, path_info)
            if changed is None:
                raise AssertionError(
                    "Got entry<->path mismatch for specific path "
                    "%r entry %r path_info %r " % (
                    path_utf8, entry, path_info))
            # Only include changes - we're outside the users requested
            # expansion.
            # NOTE(review): the yield below also fires when
            # self.include_unchanged is set, which does not match the
            # sentence above - confirm which one is intended.
            if changed:
                self._gather_result_for_consistency(result)
                if (result[6][0] == 'directory' and
                    result[6][1] != 'directory'):
                    # This stopped being a directory, the old children have
                    # to be included.
                    if entry[1][self.source_index][0] == 'r':
                        # renamed, take the source path
                        entry_path_utf8 = entry[1][self.source_index][1]
                    else:
                        entry_path_utf8 = path_utf8
                    initial_key = (entry_path_utf8, '', '')
                    block_index, _ = self.state._find_block_index_from_key(
                        initial_key)
                    if block_index == 0:
                        # The children of the root are in block index 1.
                        block_index +=1
                    current_block = None
                    if block_index < len(self.state._dirblocks):
                        current_block = self.state._dirblocks[block_index]
                        if not osutils.is_inside(
                            entry_path_utf8, current_block[0]):
                            # No entries for this directory at all.
                            current_block = None
                    if current_block is not None:
                        # NOTE: this loop rebinds the outer loop variable
                        # 'entry'.  Nothing after it in the outer loop
                        # body reads 'entry', and the outer for statement
                        # rebinds it on its next iteration.
                        for entry in current_block[1]:
                            if entry[1][self.source_index][0] in 'ar':
                                # Not in the source tree, so doesn't have to be
                                # included.
                                continue
                            # Path of the entry itself.

                            self.search_specific_file_parents.add(
                                osutils.pathjoin(*entry[0][:2]))
            if changed or self.include_unchanged:
                yield result
        # Remember the path so that it is not examined a second time.
        self.searched_exact_paths.add(path_utf8)

4105

4106

def _path_info(self, utf8_path, unicode_path):

4107

"""Generate path_info for unicode_path.

4108

4109

:return: None if unicode_path does not exist, or a path_info tuple.

4110

"""

4111

abspath = self.tree.abspath(unicode_path)

4112

try:

4113

stat = os.lstat(abspath)

4114

except OSError, e:

4115

if e.errno == errno.ENOENT:

4116

# the path does not exist.

4117

return None

4118

else:

4119

raise

4120

utf8_basename = utf8_path.rsplit('/', 1)[-1]

4121

dir_info = (utf8_path, utf8_basename,

4122

osutils.file_kind_from_stat_mode(stat.st_mode), stat,

4123

abspath)

4124

if dir_info[2] == 'directory':

4125

if self.tree._directory_is_tree_reference(

4126

unicode_path):

4127

self.root_dir_info = self.root_dir_info[:2] + \

4128

('tree-reference',) + self.root_dir_info[3:]

4129

return dir_info

4130

4131

4132

# Try to load the compiled form if possible.  On success, _process_entry and
# update_entry are bound to the implementations exported by
# bzrlib._dirstate_helpers_pyx.
try:
    from bzrlib._dirstate_helpers_pyx import (
        _read_dirblocks,
        bisect_dirblock,
        _bisect_path_left,
        _bisect_path_right,
        cmp_by_dirs,
        ProcessEntryC as _process_entry,
        update_entry as update_entry,
        )
except ImportError, e:
    # Report the failed import, then fall back to the helpers from
    # bzrlib._dirstate_helpers_py.
    osutils.failed_to_load_extension(e)
    from bzrlib._dirstate_helpers_py import (
        _read_dirblocks,
        bisect_dirblock,
        _bisect_path_left,
        _bisect_path_right,
        cmp_by_dirs,
        )
    # FIXME: It would be nice to be able to track moved lines so that the
    # corresponding python code can be moved to the _dirstate_helpers_py
    # module. I don't want to break the history for this important piece of
    # code so I left the code here -- vila 20090622
    # These two fallbacks are the names py_update_entry and
    # ProcessEntryPython from this module, not imports from the helper
    # module.
    update_entry = py_update_entry
    _process_entry = ProcessEntryPython

Older »