/brz/remove-bazaar : revision 4679.9.19

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/chk_map.py

Committer: John Arbash Meinel
Date: 2009-10-23 15:46:01 UTC
mto: This revision was merged to the branch mainline in revision 4771.
Revision ID: john@arbash-meinel.com-20091023154601-2gg0gcbs3s5m90c3

Interning the start and stop group positions saves another 7MB peak mem. \o/

I'm hoping some of this savings is the 'dark memory', but that is unclear at this point.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_import_c_api.h

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/doc_generate/sphinx_conf.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/static_tuple.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_foreign_vcs

bzrlib/tests/per_foreign_vcs/__init__.py

bzrlib/tests/per_foreign_vcs/test_branch.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_uifactory

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/script.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_script.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/pathfilter.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/Bazaar-Logo-For-Manuals.png

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/conf.py

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/implementation-notes.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index-plain.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/miscellaneous-notes.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/process.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/specifications.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_static/en/Makefile

doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/_static/en/bzr-en-quick-reference.png

doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/Makefile

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/index.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/index.txt

doc/es/user-guide

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/news-template.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/convertfile.py

tools/convertinv.py

tools/generate_docs.py

tools/generate_release_notes.py

tools/history2revfiles.py

tools/http_client.py

tools/package_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-control.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/chk_map.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Persistent maps from tuple_of_strings->string using CHK stores.

Overview and current status:

The CHKMap class implements a dict from tuple_of_strings->string by using a trie

with internal nodes of 8-bit fan out; The key tuples are mapped to strings by

joining them by \x00, and \x00 padding shorter keys out to the length of the

longest key. Leaf nodes are packed as densely as possible, and internal nodes

are all an additional 8-bits wide leading to a sparse upper tree.

Updates to a CHKMap are done preferentially via the apply_delta method, to

allow optimisation of the update operation; but individual map/unmap calls are

possible and supported. Individual changes via map/unmap are buffered in memory

until the _save method is called to force serialisation of the tree.

apply_delta records its changes immediately by performing an implicit _save.

TODO:

-----

Densely packed upper nodes.

"""

import heapq

from bzrlib import lazy_import

lazy_import.lazy_import(globals(), """

from bzrlib import (

errors,

versionedfile,

)

""")

from bzrlib import (

lru_cache,

osutils,

registry,

trace,

)

from bzrlib.static_tuple import StaticTuple

# approx 4MB

# If each line is 50 bytes, and you have 255 internal pages, with 255-way fan

# out, it takes 3.1MB to cache the layer.

_PAGE_CACHE_SIZE = 4*1024*1024

# We are caching bytes so len(value) is perfectly accurate

_page_cache = lru_cache.LRUSizeCache(_PAGE_CACHE_SIZE)

def clear_cache():

_page_cache.clear()

# If a ChildNode falls below this many bytes, we check for a remap

_INTERESTING_NEW_SIZE = 50

# If a ChildNode shrinks by more than this amount, we check for a remap

_INTERESTING_SHRINKAGE_LIMIT = 20

# If we delete more than this many nodes applying a delta, we check for a remap

_INTERESTING_DELETES_LIMIT = 5

def _search_key_plain(key):

"""Map the key tuple into a search string that just uses the key bytes."""

return '\x00'.join(key)

search_key_registry = registry.Registry()

search_key_registry.register('plain', _search_key_plain)

class CHKMap(object):

"""A persistent map from string to string backed by a CHK store."""

__slots__ = ('_store', '_root_node', '_search_key_func')

def __init__(self, store, root_key, search_key_func=None):

"""Create a CHKMap object.

:param store: The store the CHKMap is stored in.

:param root_key: The root key of the map. None to create an empty

CHKMap.

:param search_key_func: A function mapping a key => bytes. These bytes

are then used by the internal nodes to split up leaf nodes into

multiple pages.

"""

self._store = store

100

if search_key_func is None:

101

search_key_func = _search_key_plain

102

self._search_key_func = search_key_func

103

if root_key is None:

104

self._root_node = LeafNode(search_key_func=search_key_func)

105

else:

106

self._root_node = self._node_key(root_key)

107

108

def apply_delta(self, delta):

109

"""Apply a delta to the map.

110

111

:param delta: An iterable of old_key, new_key, new_value tuples.

112

If new_key is not None, then new_key->new_value is inserted

113

into the map; if old_key is not None, then the old mapping

114

of old_key is removed.

115

"""

116

delete_count = 0

117

# Check preconditions first.

118

as_st = StaticTuple.from_sequence

119

new_items = set([as_st(key) for (old, key, value) in delta

120

if key is not None and old is None])

121

existing_new = list(self.iteritems(key_filter=new_items))

122

if existing_new:

123

raise errors.InconsistentDeltaDelta(delta,

124

"New items are already in the map %r." % existing_new)

125

# Now apply changes.

126

for old, new, value in delta:

127

if old is not None and old != new:

128

self.unmap(old, check_remap=False)

129

delete_count += 1

130

for old, new, value in delta:

131

if new is not None:

132

self.map(new, value)

133

if delete_count > _INTERESTING_DELETES_LIMIT:

134

trace.mutter("checking remap as %d deletions", delete_count)

135

self._check_remap()

136

return self._save()

137

138

def _ensure_root(self):

139

"""Ensure that the root node is an object not a key."""

140

if type(self._root_node) is StaticTuple:

141

# Demand-load the root

142

self._root_node = self._get_node(self._root_node)

143

144

def _get_node(self, node):

145

"""Get a node.

146

147

Note that this does not update the _items dict in objects containing a

148

reference to this node. As such it does not prevent subsequent IO being

149

performed.

150

151

:param node: A tuple key or node object.

152

:return: A node object.

153

"""

154

if type(node) is StaticTuple:

155

bytes = self._read_bytes(node)

156

return _deserialise(bytes, node,

157

search_key_func=self._search_key_func)

158

else:

159

return node

160

161

def _read_bytes(self, key):

162

try:

163

return _page_cache[key]

164

except KeyError:

165

stream = self._store.get_record_stream([key], 'unordered', True)

166

bytes = stream.next().get_bytes_as('fulltext')

167

_page_cache[key] = bytes

168

return bytes

169

170

def _dump_tree(self, include_keys=False):

171

"""Return the tree in a string representation."""

172

self._ensure_root()

173

res = self._dump_tree_node(self._root_node, prefix='', indent='',

174

include_keys=include_keys)

175

res.append('') # Give a trailing '\n'

176

return '\n'.join(res)

177

178

def _dump_tree_node(self, node, prefix, indent, include_keys=True):

179

"""For this node and all children, generate a string representation."""

180

result = []

181

if not include_keys:

182

key_str = ''

183

else:

184

node_key = node.key()

185

if node_key is not None:

186

key_str = ' %s' % (node_key[0],)

187

else:

188

key_str = ' None'

189

result.append('%s%r %s%s' % (indent, prefix, node.__class__.__name__,

190

key_str))

191

if type(node) is InternalNode:

192

# Trigger all child nodes to get loaded

193

list(node._iter_nodes(self._store))

194

for prefix, sub in sorted(node._items.iteritems()):

195

result.extend(self._dump_tree_node(sub, prefix, indent + ' ',

196

include_keys=include_keys))

197

else:

198

for key, value in sorted(node._items.iteritems()):

199

# Don't use prefix nor indent here to line up when used in

200

# tests in conjunction with assertEqualDiff

201

result.append(' %r %r' % (tuple(key), value))

202

return result

203

204

@classmethod

205

def from_dict(klass, store, initial_value, maximum_size=0, key_width=1,

206

search_key_func=None):

207

"""Create a CHKMap in store with initial_value as the content.

208

209

:param store: The store to record initial_value in, a VersionedFiles

210

object with 1-tuple keys supporting CHK key generation.

211

:param initial_value: A dict to store in store. Its keys and values

212

must be bytestrings.

213

:param maximum_size: The maximum_size rule to apply to nodes. This

214

determines the size at which no new data is added to a single node.

215

:param key_width: The number of elements in each key_tuple being stored

216

in this map.

217

:param search_key_func: A function mapping a key => bytes. These bytes

218

are then used by the internal nodes to split up leaf nodes into

219

multiple pages.

220

:return: The root chk of the resulting CHKMap.

221

"""

222

root_key = klass._create_directly(store, initial_value,

223

maximum_size=maximum_size, key_width=key_width,

224

search_key_func=search_key_func)

225

if type(root_key) is not StaticTuple:

226

raise AssertionError('we got a %s instead of a StaticTuple'

227

% (type(root_key),))

228

return root_key

229

230

@classmethod

231

def _create_via_map(klass, store, initial_value, maximum_size=0,

232

key_width=1, search_key_func=None):

233

result = klass(store, None, search_key_func=search_key_func)

234

result._root_node.set_maximum_size(maximum_size)

235

result._root_node._key_width = key_width

236

delta = []

237

for key, value in initial_value.items():

238

delta.append((None, key, value))

239

root_key = result.apply_delta(delta)

240

return root_key

241

242

@classmethod

243

def _create_directly(klass, store, initial_value, maximum_size=0,

244

key_width=1, search_key_func=None):

245

node = LeafNode(search_key_func=search_key_func)

246

node.set_maximum_size(maximum_size)

247

node._key_width = key_width

248

as_st = StaticTuple.from_sequence

249

node._items = dict([(as_st(key), val) for key, val

250

in initial_value.iteritems()])

251

node._raw_size = sum([node._key_value_len(key, value)

252

for key,value in node._items.iteritems()])

253

node._len = len(node._items)

254

node._compute_search_prefix()

255

node._compute_serialised_prefix()

256

if (node._len > 1

257

and maximum_size

258

and node._current_size() > maximum_size):

259

prefix, node_details = node._split(store)

260

if len(node_details) == 1:

261

raise AssertionError('Failed to split using node._split')

262

node = InternalNode(prefix, search_key_func=search_key_func)

263

node.set_maximum_size(maximum_size)

264

node._key_width = key_width

265

for split, subnode in node_details:

266

node.add_node(split, subnode)

267

keys = list(node.serialise(store))

268

return keys[-1]

269

270

def iter_changes(self, basis):

271

"""Iterate over the changes between basis and self.

272

273

:return: An iterator of tuples: (key, old_value, new_value). Old_value

274

is None for keys only in self; new_value is None for keys only in

275

basis.

276

"""

277

# Overview:

278

# Read both trees in lexographic, highest-first order.

279

# Any identical nodes we skip

280

# Any unique prefixes we output immediately.

281

# values in a leaf node are treated as single-value nodes in the tree

282

# which allows them to be not-special-cased. We know to output them

283

# because their value is a string, not a key(tuple) or node.

284

285

# corner cases to beware of when considering this function:

286

# *) common references are at different heights.

287

# consider two trees:

288

# {'a': LeafNode={'aaa':'foo', 'aab':'bar'}, 'b': LeafNode={'b'}}

289

# {'a': InternalNode={'aa':LeafNode={'aaa':'foo', 'aab':'bar'},

290

# 'ab':LeafNode={'ab':'bar'}}

291

# 'b': LeafNode={'b'}}

292

# the node with aaa/aab will only be encountered in the second tree

293

# after reading the 'a' subtree, but it is encountered in the first

294

# tree immediately. Variations on this may have read internal nodes

295

# like this. we want to cut the entire pending subtree when we

296

# realise we have a common node. For this we use a list of keys -

297

# the path to a node - and check the entire path is clean as we

298

# process each item.

299

if self._node_key(self._root_node) == self._node_key(basis._root_node):

300

return

301

self._ensure_root()

302

basis._ensure_root()

303

excluded_keys = set()

304

self_node = self._root_node

305

basis_node = basis._root_node

306

# A heap, each element is prefix, node(tuple/NodeObject/string),

307

# key_path (a list of tuples, tail-sharing down the tree.)

308

self_pending = []

309

basis_pending = []

310

def process_node(node, path, a_map, pending):

311

# take a node and expand it

312

node = a_map._get_node(node)

313

if type(node) == LeafNode:

314

path = (node._key, path)

315

for key, value in node._items.items():

316

# For a LeafNode, the key is a serialized_key, rather than

317

# a search_key, but the heap is using search_keys

318

search_key = node._search_key_func(key)

319

heapq.heappush(pending, (search_key, key, value, path))

320

else:

321

# type(node) == InternalNode

322

path = (node._key, path)

323

for prefix, child in node._items.items():

324

heapq.heappush(pending, (prefix, None, child, path))

325

def process_common_internal_nodes(self_node, basis_node):

326

self_items = set(self_node._items.items())

327

basis_items = set(basis_node._items.items())

328

path = (self_node._key, None)

329

for prefix, child in self_items - basis_items:

330

heapq.heappush(self_pending, (prefix, None, child, path))

331

path = (basis_node._key, None)

332

for prefix, child in basis_items - self_items:

333

heapq.heappush(basis_pending, (prefix, None, child, path))

334

def process_common_leaf_nodes(self_node, basis_node):

335

self_items = set(self_node._items.items())

336

basis_items = set(basis_node._items.items())

337

path = (self_node._key, None)

338

for key, value in self_items - basis_items:

339

prefix = self._search_key_func(key)

340

heapq.heappush(self_pending, (prefix, key, value, path))

341

path = (basis_node._key, None)

342

for key, value in basis_items - self_items:

343

prefix = basis._search_key_func(key)

344

heapq.heappush(basis_pending, (prefix, key, value, path))

345

def process_common_prefix_nodes(self_node, self_path,

346

basis_node, basis_path):

347

# Would it be more efficient if we could request both at the same

348

# time?

349

self_node = self._get_node(self_node)

350

basis_node = basis._get_node(basis_node)

351

if (type(self_node) == InternalNode

352

and type(basis_node) == InternalNode):

353

# Matching internal nodes

354

process_common_internal_nodes(self_node, basis_node)

355

elif (type(self_node) == LeafNode

356

and type(basis_node) == LeafNode):

357

process_common_leaf_nodes(self_node, basis_node)

358

else:

359

process_node(self_node, self_path, self, self_pending)

360

process_node(basis_node, basis_path, basis, basis_pending)

361

process_common_prefix_nodes(self_node, None, basis_node, None)

362

self_seen = set()

363

basis_seen = set()

364

excluded_keys = set()

365

def check_excluded(key_path):

366

# Note that this is N^2, it depends on us trimming trees

367

# aggressively to not become slow.

368

# A better implementation would probably have a reverse map

369

# back to the children of a node, and jump straight to it when

370

# a common node is detected, the proceed to remove the already

371

# pending children. bzrlib.graph has a searcher module with a

372

# similar problem.

373

while key_path is not None:

374

key, key_path = key_path

375

if key in excluded_keys:

376

return True

377

return False

378

379

loop_counter = 0

380

while self_pending or basis_pending:

381

loop_counter += 1

382

if not self_pending:

383

# self is exhausted: output remainder of basis

384

for prefix, key, node, path in basis_pending:

385

if check_excluded(path):

386

continue

387

node = basis._get_node(node)

388

if key is not None:

389

# a value

390

yield (key, node, None)

391

else:

392

# subtree - fastpath the entire thing.

393

for key, value in node.iteritems(basis._store):

394

yield (key, value, None)

395

return

396

elif not basis_pending:

397

# basis is exhausted: output remainder of self.

398

for prefix, key, node, path in self_pending:

399

if check_excluded(path):

400

continue

401

node = self._get_node(node)

402

if key is not None:

403

# a value

404

yield (key, None, node)

405

else:

406

# subtree - fastpath the entire thing.

407

for key, value in node.iteritems(self._store):

408

yield (key, None, value)

409

return

410

else:

411

# XXX: future optimisation - yield the smaller items

412

# immediately rather than pushing everything on/off the

413

# heaps. Applies to both internal nodes and leafnodes.

414

if self_pending[0][0] < basis_pending[0][0]:

415

# expand self

416

prefix, key, node, path = heapq.heappop(self_pending)

417

if check_excluded(path):

418

continue

419

if key is not None:

420

# a value

421

yield (key, None, node)

422

else:

423

process_node(node, path, self, self_pending)

424

continue

425

elif self_pending[0][0] > basis_pending[0][0]:

426

# expand basis

427

prefix, key, node, path = heapq.heappop(basis_pending)

428

if check_excluded(path):

429

continue

430

if key is not None:

431

# a value

432

yield (key, node, None)

433

else:

434

process_node(node, path, basis, basis_pending)

435

continue

436

else:

437

# common prefix: possibly expand both

438

if self_pending[0][1] is None:

439

# process next self

440

read_self = True

441

else:

442

read_self = False

443

if basis_pending[0][1] is None:

444

# process next basis

445

read_basis = True

446

else:

447

read_basis = False

448

if not read_self and not read_basis:

449

# compare a common value

450

self_details = heapq.heappop(self_pending)

451

basis_details = heapq.heappop(basis_pending)

452

if self_details[2] != basis_details[2]:

453

yield (self_details[1],

454

basis_details[2], self_details[2])

455

continue

456

# At least one side wasn't a simple value

457

if (self._node_key(self_pending[0][2]) ==

458

self._node_key(basis_pending[0][2])):

459

# Identical pointers, skip (and don't bother adding to

460

# excluded, it won't turn up again.

461

heapq.heappop(self_pending)

462

heapq.heappop(basis_pending)

463

continue

464

# Now we need to expand this node before we can continue

465

if read_self and read_basis:

466

# Both sides start with the same prefix, so process

467

# them in parallel

468

self_prefix, _, self_node, self_path = heapq.heappop(

469

self_pending)

470

basis_prefix, _, basis_node, basis_path = heapq.heappop(

471

basis_pending)

472

if self_prefix != basis_prefix:

473

raise AssertionError(

474

'%r != %r' % (self_prefix, basis_prefix))

475

process_common_prefix_nodes(

476

self_node, self_path,

477

basis_node, basis_path)

478

continue

479

if read_self:

480

prefix, key, node, path = heapq.heappop(self_pending)

481

if check_excluded(path):

482

continue

483

process_node(node, path, self, self_pending)

484

if read_basis:

485

prefix, key, node, path = heapq.heappop(basis_pending)

486

if check_excluded(path):

487

continue

488

process_node(node, path, basis, basis_pending)

489

# print loop_counter

490

491

def iteritems(self, key_filter=None):

492

"""Iterate over the entire CHKMap's contents."""

493

self._ensure_root()

494

if key_filter is not None:

495

as_st = StaticTuple.from_sequence

496

key_filter = [as_st(key) for key in key_filter]

497

return self._root_node.iteritems(self._store, key_filter=key_filter)

498

499

def key(self):

500

"""Return the key for this map."""

501

if type(self._root_node) is StaticTuple:

502

return self._root_node

503

else:

504

return self._root_node._key

505

506

def __len__(self):

507

self._ensure_root()

508

return len(self._root_node)

509

510

def map(self, key, value):

511

"""Map a key tuple to value.

512

513

:param key: A key to map.

514

:param value: The value to assign to key.

515

"""

516

key = StaticTuple.from_sequence(key)

517

# Need a root object.

518

self._ensure_root()

519

prefix, node_details = self._root_node.map(self._store, key, value)

520

if len(node_details) == 1:

521

self._root_node = node_details[0][1]

522

else:

523

self._root_node = InternalNode(prefix,

524

search_key_func=self._search_key_func)

525

self._root_node.set_maximum_size(node_details[0][1].maximum_size)

526

self._root_node._key_width = node_details[0][1]._key_width

527

for split, node in node_details:

528

self._root_node.add_node(split, node)

529

530

def _node_key(self, node):

531

"""Get the key for a node whether it's a tuple or node."""

532

if type(node) is tuple:

533

node = StaticTuple.from_sequence(node)

534

if type(node) is StaticTuple:

535

return node

536

else:

537

return node._key

538

539

def unmap(self, key, check_remap=True):

540

"""remove key from the map."""

541

key = StaticTuple.from_sequence(key)

542

self._ensure_root()

543

if type(self._root_node) is InternalNode:

544

unmapped = self._root_node.unmap(self._store, key,

545

check_remap=check_remap)

546

else:

547

unmapped = self._root_node.unmap(self._store, key)

548

self._root_node = unmapped

549

550

def _check_remap(self):

551

"""Check if nodes can be collapsed."""

552

self._ensure_root()

553

if type(self._root_node) is InternalNode:

554

self._root_node._check_remap(self._store)

555

556

def _save(self):

557

"""Save the map completely.

558

559

:return: The key of the root node.

560

"""

561

if type(self._root_node) is StaticTuple:

562

# Already saved.

563

return self._root_node

564

keys = list(self._root_node.serialise(self._store))

565

return keys[-1]

566

567

568

class Node(object):

569

"""Base class defining the protocol for CHK Map nodes.

570

571

:ivar _raw_size: The total size of the serialized key:value data, before

572

adding the header bytes, and without prefix compression.

573

"""

574

575

__slots__ = ('_key', '_len', '_maximum_size', '_key_width',

576

'_raw_size', '_items', '_search_prefix', '_search_key_func'

577

)

578

579

def __init__(self, key_width=1):

580

"""Create a node.

581

582

:param key_width: The width of keys for this node.

583

"""

584

self._key = None

585

# Current number of elements

586

self._len = 0

587

self._maximum_size = 0

588

self._key_width = key_width

589

# current size in bytes

590

self._raw_size = 0

591

# The pointers/values this node has - meaning defined by child classes.

592

self._items = {}

593

# The common search prefix

594

self._search_prefix = None

595

596

def __repr__(self):

597

items_str = str(sorted(self._items))

598

if len(items_str) > 20:

599

items_str = items_str[:16] + '...]'

600

return '%s(key:%s len:%s size:%s max:%s prefix:%s items:%s)' % (

601

self.__class__.__name__, self._key, self._len, self._raw_size,

602

self._maximum_size, self._search_prefix, items_str)

603

604

def key(self):

605

return self._key

606

607

def __len__(self):

608

return self._len

609

610

@property

611

def maximum_size(self):

612

"""What is the upper limit for adding references to a node."""

613

return self._maximum_size

614

615

def set_maximum_size(self, new_size):

616

"""Set the size threshold for nodes.

617

618

:param new_size: The size at which no data is added to a node. 0 for

619

unlimited.

620

"""

621

self._maximum_size = new_size

622

623

@classmethod

624

def common_prefix(cls, prefix, key):

625

"""Given 2 strings, return the longest prefix common to both.

626

627

:param prefix: This has been the common prefix for other keys, so it is

628

more likely to be the common prefix in this case as well.

629

:param key: Another string to compare to

630

"""

631

if key.startswith(prefix):

632

return prefix

633

pos = -1

634

# Is there a better way to do this?

635

for pos, (left, right) in enumerate(zip(prefix, key)):

636

if left != right:

637

pos -= 1

638

break

639

common = prefix[:pos+1]

640

return common

641

642

@classmethod

643

def common_prefix_for_keys(cls, keys):

644

"""Given a list of keys, find their common prefix.

645

646

:param keys: An iterable of strings.

647

:return: The longest common prefix of all keys.

648

"""

649

common_prefix = None

650

for key in keys:

651

if common_prefix is None:

652

common_prefix = key

653

continue

654

common_prefix = cls.common_prefix(common_prefix, key)

655

if not common_prefix:

656

# if common_prefix is the empty string, then we know it won't

657

# change further

658

return ''

659

return common_prefix

660

661

662

# Singleton indicating we have not computed _search_prefix yet

663

_unknown = object()

664

665

class LeafNode(Node):

666

"""A node containing actual key:value pairs.

667

668

:ivar _items: A dict of key->value items. The key is in tuple form.

669

:ivar _size: The number of bytes that would be used by serializing all of

670

the key/value pairs.

671

"""

672

673

__slots__ = ('_common_serialised_prefix', '_serialise_key')

674

675

def __init__(self, search_key_func=None):

676

Node.__init__(self)

677

# All of the keys in this leaf node share this common prefix

678

self._common_serialised_prefix = None

679

self._serialise_key = '\x00'.join

680

if search_key_func is None:

681

self._search_key_func = _search_key_plain

682

else:

683

self._search_key_func = search_key_func

684

685

def __repr__(self):

686

items_str = str(sorted(self._items))

687

if len(items_str) > 20:

688

items_str = items_str[:16] + '...]'

689

return \

690

'%s(key:%s len:%s size:%s max:%s prefix:%s keywidth:%s items:%s)' \

691

% (self.__class__.__name__, self._key, self._len, self._raw_size,

692

self._maximum_size, self._search_prefix, self._key_width, items_str)

693

694

def _current_size(self):

695

"""Answer the current serialised size of this node.

696

697

This differs from self._raw_size in that it includes the bytes used for

698

the header.

699

"""

700

if self._common_serialised_prefix is None:

701

bytes_for_items = 0

702

prefix_len = 0

703

else:

704

# We will store a single string with the common prefix

705

# And then that common prefix will not be stored in any of the

706

# entry lines

707

prefix_len = len(self._common_serialised_prefix)

708

bytes_for_items = (self._raw_size - (prefix_len * self._len))

709

return (9 # 'chkleaf:\n'

710

+ len(str(self._maximum_size)) + 1

711

+ len(str(self._key_width)) + 1

712

+ len(str(self._len)) + 1

713

+ prefix_len + 1

714

+ bytes_for_items)

715

716

@classmethod

717

def deserialise(klass, bytes, key, search_key_func=None):

718

"""Deserialise bytes, with key key, into a LeafNode.

719

720

:param bytes: The bytes of the node.

721

:param key: The key that the serialised node has.

722

"""

723

return _deserialise_leaf_node(bytes, key,

724

search_key_func=search_key_func)

725

726

def iteritems(self, store, key_filter=None):

727

"""Iterate over items in the node.

728

729

:param key_filter: A filter to apply to the node. It should be a

730

list/set/dict or similar repeatedly iterable container.

731

"""

732

if key_filter is not None:

733

# Adjust the filter - short elements go to a prefix filter. All

734

# other items are looked up directly.

735

# XXX: perhaps defaultdict? Profiling<rinse and repeat>

736

filters = {}

737

for key in key_filter:

738

if len(key) == self._key_width:

739

# This filter is meant to match exactly one key, yield it

740

# if we have it.

741

try:

742

yield key, self._items[key]

743

except KeyError:

744

# This key is not present in this map, continue

745

pass

746

else:

747

# Short items, we need to match based on a prefix

748

length_filter = filters.setdefault(len(key), set())

749

length_filter.add(key)

750

if filters:

751

filters = filters.items()

752

for item in self._items.iteritems():

753

for length, length_filter in filters:

754

if item[0][:length] in length_filter:

755

yield item

756

break

757

else:

758

for item in self._items.iteritems():

759

yield item

760

761

def _key_value_len(self, key, value):

762

# TODO: Should probably be done without actually joining the key, but

763

# then that can be done via the C extension

764

return (len(self._serialise_key(key)) + 1

765

+ len(str(value.count('\n'))) + 1

766

+ len(value) + 1)

767

768

def _search_key(self, key):

769

return self._search_key_func(key)

770

771

def _map_no_split(self, key, value):

772

"""Map a key to a value.

773

774

This assumes either the key does not already exist, or you have already

775

removed its size and length from self.

776

777

:return: True if adding this node should cause us to split.

778

"""

779

self._items[key] = value

780

self._raw_size += self._key_value_len(key, value)

781

self._len += 1

782

serialised_key = self._serialise_key(key)

783

if self._common_serialised_prefix is None:

784

self._common_serialised_prefix = serialised_key

785

else:

786

self._common_serialised_prefix = self.common_prefix(

787

self._common_serialised_prefix, serialised_key)

788

search_key = self._search_key(key)

789

if self._search_prefix is _unknown:

790

self._compute_search_prefix()

791

if self._search_prefix is None:

792

self._search_prefix = search_key

793

else:

794

self._search_prefix = self.common_prefix(

795

self._search_prefix, search_key)

796

if (self._len > 1

797

and self._maximum_size

798

and self._current_size() > self._maximum_size):

799

# Check to see if all of the search_keys for this node are

800

# identical. We allow the node to grow under that circumstance

801

# (we could track this as common state, but it is infrequent)

802

if (search_key != self._search_prefix

803

or not self._are_search_keys_identical()):

804

return True

805

return False

806

807

def _split(self, store):

808

"""We have overflowed.

809

810

Split this node into multiple LeafNodes, return it up the stack so that

811

the next layer creates a new InternalNode and references the new nodes.

812

813

:return: (common_serialised_prefix, [(node_serialised_prefix, node)])

814

"""

815

if self._search_prefix is _unknown:

816

raise AssertionError('Search prefix must be known')

817

common_prefix = self._search_prefix

818

split_at = len(common_prefix) + 1

819

result = {}

820

for key, value in self._items.iteritems():

821

search_key = self._search_key(key)

822

prefix = search_key[:split_at]

823

# TODO: Generally only 1 key can be exactly the right length,

824

# which means we can only have 1 key in the node pointed

825

# at by the 'prefix\0' key. We might want to consider

826

# folding it into the containing InternalNode rather than

827

# having a fixed length-1 node.

828

# Note this is probably not true for hash keys, as they

829

# may get a '\00' node anywhere, but won't have keys of

830

# different lengths.

831

if len(prefix) < split_at:

832

prefix += '\x00'*(split_at - len(prefix))

833

if prefix not in result:

834

node = LeafNode(search_key_func=self._search_key_func)

835

node.set_maximum_size(self._maximum_size)

836

node._key_width = self._key_width

837

result[prefix] = node

838

else:

839

node = result[prefix]

840

sub_prefix, node_details = node.map(store, key, value)

841

if len(node_details) > 1:

842

if prefix != sub_prefix:

843

# This node has been split and is now found via a different

844

# path

845

result.pop(prefix)

846

new_node = InternalNode(sub_prefix,

847

search_key_func=self._search_key_func)

848

new_node.set_maximum_size(self._maximum_size)

849

new_node._key_width = self._key_width

850

for split, node in node_details:

851

new_node.add_node(split, node)

852

result[prefix] = new_node

853

return common_prefix, result.items()

854

855

def map(self, store, key, value):

856

"""Map key to value."""

857

if key in self._items:

858

self._raw_size -= self._key_value_len(key, self._items[key])

859

self._len -= 1

860

self._key = None

861

if self._map_no_split(key, value):

862

return self._split(store)

863

else:

864

if self._search_prefix is _unknown:

865

raise AssertionError('%r must be known' % self._search_prefix)

866

return self._search_prefix, [("", self)]

867

868

def serialise(self, store):

869

"""Serialise the LeafNode to store.

870

871

:param store: A VersionedFiles honouring the CHK extensions.

872

:return: An iterable of the keys inserted by this operation.

873

"""

874

lines = ["chkleaf:\n"]

875

lines.append("%d\n" % self._maximum_size)

876

lines.append("%d\n" % self._key_width)

877

lines.append("%d\n" % self._len)

878

if self._common_serialised_prefix is None:

879

lines.append('\n')

880

if len(self._items) != 0:

881

raise AssertionError('If _common_serialised_prefix is None'

882

' we should have no items')

883

else:

884

lines.append('%s\n' % (self._common_serialised_prefix,))

885

prefix_len = len(self._common_serialised_prefix)

886

for key, value in sorted(self._items.items()):

887

# Always add a final newline

888

value_lines = osutils.chunks_to_lines([value + '\n'])

889

serialized = "%s\x00%s\n" % (self._serialise_key(key),

890

len(value_lines))

891

if not serialized.startswith(self._common_serialised_prefix):

892

raise AssertionError('We thought the common prefix was %r'

893

' but entry %r does not have it in common'

894

% (self._common_serialised_prefix, serialized))

895

lines.append(serialized[prefix_len:])

896

lines.extend(value_lines)

897

sha1, _, _ = store.add_lines((None,), (), lines)

898

self._key = StaticTuple("sha1:" + sha1,).intern()

899

bytes = ''.join(lines)

900

if len(bytes) != self._current_size():

901

raise AssertionError('Invalid _current_size')

902

_page_cache.add(self._key, bytes)

903

return [self._key]

904

905

def refs(self):

906

"""Return the references to other CHK's held by this node."""

907

return []

908

909

def _compute_search_prefix(self):

910

"""Determine the common search prefix for all keys in this node.

911

912

:return: A bytestring of the longest search key prefix that is

913

unique within this node.

914

"""

915

search_keys = [self._search_key_func(key) for key in self._items]

916

self._search_prefix = self.common_prefix_for_keys(search_keys)

917

return self._search_prefix

918

919

def _are_search_keys_identical(self):

920

"""Check to see if the search keys for all entries are the same.

921

922

When using a hash as the search_key it is possible for non-identical

923

keys to collide. If that happens enough, we may try overflow a

924

LeafNode, but as all are collisions, we must not split.

925

"""

926

common_search_key = None

927

for key in self._items:

928

search_key = self._search_key(key)

929

if common_search_key is None:

930

common_search_key = search_key

931

elif search_key != common_search_key:

932

return False

933

return True

934

935

def _compute_serialised_prefix(self):

936

"""Determine the common prefix for serialised keys in this node.

937

938

:return: A bytestring of the longest serialised key prefix that is

939

unique within this node.

940

"""

941

serialised_keys = [self._serialise_key(key) for key in self._items]

942

self._common_serialised_prefix = self.common_prefix_for_keys(

943

serialised_keys)

944

return self._common_serialised_prefix

945

946

def unmap(self, store, key):

947

"""Unmap key from the node."""

948

try:

949

self._raw_size -= self._key_value_len(key, self._items[key])

950

except KeyError:

951

trace.mutter("key %s not found in %r", key, self._items)

952

raise

953

self._len -= 1

954

del self._items[key]

955

self._key = None

956

# Recompute from scratch

957

self._compute_search_prefix()

958

self._compute_serialised_prefix()

959

return self

960

961

962

class InternalNode(Node):

963

"""A node that contains references to other nodes.

964

965

An InternalNode is responsible for mapping search key prefixes to child

966

nodes.

967

968

:ivar _items: serialised_key => node dictionary. node may be a tuple,

969

LeafNode or InternalNode.

970

"""

971

972

__slots__ = ('_node_width',)

973

974

def __init__(self, prefix='', search_key_func=None):

975

Node.__init__(self)

976

# The size of an internalnode with default values and no children.

977

# How many octets key prefixes within this node are.

978

self._node_width = 0

979

self._search_prefix = prefix

980

if search_key_func is None:

981

self._search_key_func = _search_key_plain

982

else:

983

self._search_key_func = search_key_func

984

985

def add_node(self, prefix, node):

986

"""Add a child node with prefix prefix, and node node.

987

988

:param prefix: The search key prefix for node.

989

:param node: The node being added.

990

"""

991

if self._search_prefix is None:

992

raise AssertionError("_search_prefix should not be None")

993

if not prefix.startswith(self._search_prefix):

994

raise AssertionError("prefixes mismatch: %s must start with %s"

995

% (prefix,self._search_prefix))

996

if len(prefix) != len(self._search_prefix) + 1:

997

raise AssertionError("prefix wrong length: len(%s) is not %d" %

998

(prefix, len(self._search_prefix) + 1))

999

self._len += len(node)

1000

if not len(self._items):

1001

self._node_width = len(prefix)

1002

if self._node_width != len(self._search_prefix) + 1:

1003

raise AssertionError("node width mismatch: %d is not %d" %

1004

(self._node_width, len(self._search_prefix) + 1))

1005

self._items[prefix] = node

1006

self._key = None

1007

1008

def _current_size(self):

1009

"""Answer the current serialised size of this node."""

1010

return (self._raw_size + len(str(self._len)) + len(str(self._key_width)) +

1011

len(str(self._maximum_size)))

1012

1013

@classmethod

1014

def deserialise(klass, bytes, key, search_key_func=None):

1015

"""Deserialise bytes to an InternalNode, with key key.

1016

1017

:param bytes: The bytes of the node.

1018

:param key: The key that the serialised node has.

1019

:return: An InternalNode instance.

1020

"""

1021

if type(key) is not StaticTuple:

1022

raise AssertionError('deserialise should be called with a'

1023

' StaticTuple not %s' % (type(key),))

1024

return _deserialise_internal_node(bytes, key,

1025

search_key_func=search_key_func)

1026

1027

def iteritems(self, store, key_filter=None):

1028

for node, node_filter in self._iter_nodes(store, key_filter=key_filter):

1029

for item in node.iteritems(store, key_filter=node_filter):

1030

yield item

1031

1032

def _iter_nodes(self, store, key_filter=None, batch_size=None):

1033

"""Iterate over node objects which match key_filter.

1034

1035

:param store: A store to use for accessing content.

1036

:param key_filter: A key filter to filter nodes. Only nodes that might

1037

contain a key in key_filter will be returned.

1038

:param batch_size: If not None, then we will return the nodes that had

1039

to be read using get_record_stream in batches, rather than reading

1040

them all at once.

1041

:return: An iterable of nodes. This function does not have to be fully

1042

consumed. (There will be no pending I/O when items are being returned.)

1043

"""

1044

# Map from chk key ('sha1:...',) to (prefix, key_filter)

1045

# prefix is the key in self._items to use, key_filter is the key_filter

1046

# entries that would match this node

1047

keys = {}

1048

shortcut = False

1049

if key_filter is None:

1050

# yielding all nodes, yield whatever we have, and queue up a read

1051

# for whatever we are missing

1052

shortcut = True

1053

for prefix, node in self._items.iteritems():

1054

if node.__class__ is StaticTuple:

1055

keys[node] = (prefix, None)

1056

else:

1057

yield node, None

1058

elif len(key_filter) == 1:

1059

# Technically, this path could also be handled by the first check

1060

# in 'self._node_width' in length_filters. However, we can handle

1061

# this case without spending any time building up the

1062

# prefix_to_keys, etc state.

1063

1064

# This is a bit ugly, but TIMEIT showed it to be by far the fastest

1065

# 0.626us list(key_filter)[0]

1066

# is a func() for list(), 2 mallocs, and a getitem

1067

# 0.489us [k for k in key_filter][0]

1068

# still has the mallocs, avoids the func() call

1069

# 0.350us iter(key_filter).next()

1070

# has a func() call, and mallocs an iterator

1071

# 0.125us for key in key_filter: pass

1072

# no func() overhead, might malloc an iterator

1073

# 0.105us for key in key_filter: break

1074

# no func() overhead, might malloc an iterator, probably

1075

# avoids checking an 'else' clause as part of the for

1076

for key in key_filter:

1077

break

1078

search_prefix = self._search_prefix_filter(key)

1079

if len(search_prefix) == self._node_width:

1080

# This item will match exactly, so just do a dict lookup, and

1081

# see what we can return

1082

shortcut = True

1083

try:

1084

node = self._items[search_prefix]

1085

except KeyError:

1086

# A given key can only match 1 child node, if it isn't

1087

# there, then we can just return nothing

1088

return

1089

if node.__class__ is StaticTuple:

1090

keys[node] = (search_prefix, [key])

1091

else:

1092

# This is loaded, and the only thing that can match,

1093

# return

1094

yield node, [key]

1095

return

1096

if not shortcut:

1097

# First, convert all keys into a list of search prefixes

1098

# Aggregate common prefixes, and track the keys they come from

1099

prefix_to_keys = {}

1100

length_filters = {}

1101

for key in key_filter:

1102

search_prefix = self._search_prefix_filter(key)

1103

length_filter = length_filters.setdefault(

1104

len(search_prefix), set())

1105

length_filter.add(search_prefix)

1106

prefix_to_keys.setdefault(search_prefix, []).append(key)

1107

1108

if (self._node_width in length_filters

1109

and len(length_filters) == 1):

1110

# all of the search prefixes match exactly _node_width. This

1111

# means that everything is an exact match, and we can do a

1112

# lookup into self._items, rather than iterating over the items

1113

# dict.

1114

search_prefixes = length_filters[self._node_width]

1115

for search_prefix in search_prefixes:

1116

try:

1117

node = self._items[search_prefix]

1118

except KeyError:

1119

# We can ignore this one

1120

continue

1121

node_key_filter = prefix_to_keys[search_prefix]

1122

if node.__class__ is StaticTuple:

1123

keys[node] = (search_prefix, node_key_filter)

1124

else:

1125

yield node, node_key_filter

1126

else:

1127

# The slow way. We walk every item in self._items, and check to

1128

# see if there are any matches

1129

length_filters = length_filters.items()

1130

for prefix, node in self._items.iteritems():

1131

node_key_filter = []

1132

for length, length_filter in length_filters:

1133

sub_prefix = prefix[:length]

1134

if sub_prefix in length_filter:

1135

node_key_filter.extend(prefix_to_keys[sub_prefix])

1136

if node_key_filter: # this key matched something, yield it

1137

if node.__class__ is StaticTuple:

1138

keys[node] = (prefix, node_key_filter)

1139

else:

1140

yield node, node_key_filter

1141

if keys:

1142

# Look in the page cache for some more bytes

1143

found_keys = set()

1144

for key in keys:

1145

try:

1146

bytes = _page_cache[key]

1147

except KeyError:

1148

continue

1149

else:

1150

node = _deserialise(bytes, key,

1151

search_key_func=self._search_key_func)

1152

prefix, node_key_filter = keys[key]

1153

self._items[prefix] = node

1154

found_keys.add(key)

1155

yield node, node_key_filter

1156

for key in found_keys:

1157

del keys[key]

1158

if keys:

1159

# demand load some pages.

1160

if batch_size is None:

1161

# Read all the keys in

1162

batch_size = len(keys)

1163

key_order = list(keys)

1164

for batch_start in range(0, len(key_order), batch_size):

1165

batch = key_order[batch_start:batch_start + batch_size]

1166

# We have to fully consume the stream so there is no pending

1167

# I/O, so we buffer the nodes for now.

1168

stream = store.get_record_stream(batch, 'unordered', True)

1169

node_and_filters = []

1170

for record in stream:

1171

bytes = record.get_bytes_as('fulltext')

1172

node = _deserialise(bytes, record.key,

1173

search_key_func=self._search_key_func)

1174

prefix, node_key_filter = keys[record.key]

1175

node_and_filters.append((node, node_key_filter))

1176

self._items[prefix] = node

1177

_page_cache.add(record.key, bytes)

1178

for info in node_and_filters:

1179

yield info

1180

1181

def map(self, store, key, value):

1182

"""Map key to value."""

1183

if not len(self._items):

1184

raise AssertionError("can't map in an empty InternalNode.")

1185

search_key = self._search_key(key)

1186

if self._node_width != len(self._search_prefix) + 1:

1187

raise AssertionError("node width mismatch: %d is not %d" %

1188

(self._node_width, len(self._search_prefix) + 1))

1189

if not search_key.startswith(self._search_prefix):

1190

# This key doesn't fit in this index, so we need to split at the

1191

# point where it would fit, insert self into that internal node,

1192

# and then map this key into that node.

1193

new_prefix = self.common_prefix(self._search_prefix,

1194

search_key)

1195

new_parent = InternalNode(new_prefix,

1196

search_key_func=self._search_key_func)

1197

new_parent.set_maximum_size(self._maximum_size)

1198

new_parent._key_width = self._key_width

1199

new_parent.add_node(self._search_prefix[:len(new_prefix)+1],

1200

self)

1201

return new_parent.map(store, key, value)

1202

children = [node for node, _

1203

in self._iter_nodes(store, key_filter=[key])]

1204

if children:

1205

child = children[0]

1206

else:

1207

# new child needed:

1208

child = self._new_child(search_key, LeafNode)

1209

old_len = len(child)

1210

if type(child) is LeafNode:

1211

old_size = child._current_size()

1212

else:

1213

old_size = None

1214

prefix, node_details = child.map(store, key, value)

1215

if len(node_details) == 1:

1216

# child may have shrunk, or might be a new node

1217

child = node_details[0][1]

1218

self._len = self._len - old_len + len(child)

1219

self._items[search_key] = child

1220

self._key = None

1221

new_node = self

1222

if type(child) is LeafNode:

1223

if old_size is None:

1224

# The old node was an InternalNode which means it has now

1225

# collapsed, so we need to check if it will chain to a

1226

# collapse at this level.

1227

trace.mutter("checking remap as InternalNode -> LeafNode")

1228

new_node = self._check_remap(store)

1229

else:

1230

# If the LeafNode has shrunk in size, we may want to run

1231

# a remap check. Checking for a remap is expensive though

1232

# and the frequency of a successful remap is very low.

1233

# Shrinkage by small amounts is common, so we only do the

1234

# remap check if the new_size is low or the shrinkage

1235

# amount is over a configurable limit.

1236

new_size = child._current_size()

1237

shrinkage = old_size - new_size

1238

if (shrinkage > 0 and new_size < _INTERESTING_NEW_SIZE

1239

or shrinkage > _INTERESTING_SHRINKAGE_LIMIT):

1240

trace.mutter(

1241

"checking remap as size shrunk by %d to be %d",

1242

shrinkage, new_size)

1243

new_node = self._check_remap(store)

1244

if new_node._search_prefix is None:

1245

raise AssertionError("_search_prefix should not be None")

1246

return new_node._search_prefix, [('', new_node)]

1247

# child has overflown - create a new intermediate node.

1248

# XXX: This is where we might want to try and expand our depth

1249

# to refer to more bytes of every child (which would give us

1250

# multiple pointers to child nodes, but less intermediate nodes)

1251

child = self._new_child(search_key, InternalNode)

1252

child._search_prefix = prefix

1253

for split, node in node_details:

1254

child.add_node(split, node)

1255

self._len = self._len - old_len + len(child)

1256

self._key = None

1257

return self._search_prefix, [("", self)]

1258

1259

def _new_child(self, search_key, klass):

1260

"""Create a new child node of type klass."""

1261

child = klass()

1262

child.set_maximum_size(self._maximum_size)

1263

child._key_width = self._key_width

1264

child._search_key_func = self._search_key_func

1265

self._items[search_key] = child

1266

return child

1267

1268

def serialise(self, store):

1269

"""Serialise the node to store.

1270

1271

:param store: A VersionedFiles honouring the CHK extensions.

1272

:return: An iterable of the keys inserted by this operation.

1273

"""

1274

for node in self._items.itervalues():

1275

if type(node) is StaticTuple:

1276

# Never deserialised.

1277

continue

1278

if node._key is not None:

1279

# Never altered

1280

continue

1281

for key in node.serialise(store):

1282

yield key

1283

lines = ["chknode:\n"]

1284

lines.append("%d\n" % self._maximum_size)

1285

lines.append("%d\n" % self._key_width)

1286

lines.append("%d\n" % self._len)

1287

if self._search_prefix is None:

1288

raise AssertionError("_search_prefix should not be None")

1289

lines.append('%s\n' % (self._search_prefix,))

1290

prefix_len = len(self._search_prefix)

1291

for prefix, node in sorted(self._items.items()):

1292

if type(node) is StaticTuple:

1293

key = node[0]

1294

else:

1295

key = node._key[0]

1296

serialised = "%s\x00%s\n" % (prefix, key)

1297

if not serialised.startswith(self._search_prefix):

1298

raise AssertionError("prefixes mismatch: %s must start with %s"

1299

% (serialised, self._search_prefix))

1300

lines.append(serialised[prefix_len:])

1301

sha1, _, _ = store.add_lines((None,), (), lines)

1302

self._key = StaticTuple("sha1:" + sha1,).intern()

1303

_page_cache.add(self._key, ''.join(lines))

1304

yield self._key

1305

1306

def _search_key(self, key):

1307

"""Return the serialised key for key in this node."""

1308

# search keys are fixed width. All will be self._node_width wide, so we

1309

# pad as necessary.

1310

return (self._search_key_func(key) + '\x00'*self._node_width)[:self._node_width]

1311

1312

def _search_prefix_filter(self, key):

1313

"""Serialise key for use as a prefix filter in iteritems."""

1314

return self._search_key_func(key)[:self._node_width]

1315

1316

def _split(self, offset):

1317

"""Split this node into smaller nodes starting at offset.

1318

1319

:param offset: The offset to start the new child nodes at.

1320

:return: An iterable of (prefix, node) tuples. prefix is a byte

1321

prefix for reaching node.

1322

"""

1323

if offset >= self._node_width:

1324

for node in self._items.values():

1325

for result in node._split(offset):

1326

yield result

1327

return

1328

for key, node in self._items.items():

1329

pass

1330

1331

def refs(self):

1332

"""Return the references to other CHK's held by this node."""

1333

if self._key is None:

1334

raise AssertionError("unserialised nodes have no refs.")

1335

refs = []

1336

for value in self._items.itervalues():

1337

if type(value) is StaticTuple:

1338

refs.append(value)

1339

else:

1340

refs.append(value.key())

1341

return refs

1342

1343

def _compute_search_prefix(self, extra_key=None):

1344

"""Return the unique key prefix for this node.

1345

1346

:return: A bytestring of the longest search key prefix that is

1347

unique within this node.

1348

"""

1349

self._search_prefix = self.common_prefix_for_keys(self._items)

1350

return self._search_prefix

1351

1352

def unmap(self, store, key, check_remap=True):

1353

"""Remove key from this node and it's children."""

1354

if not len(self._items):

1355

raise AssertionError("can't unmap in an empty InternalNode.")

1356

children = [node for node, _

1357

in self._iter_nodes(store, key_filter=[key])]

1358

if children:

1359

child = children[0]

1360

else:

1361

raise KeyError(key)

1362

self._len -= 1

1363

unmapped = child.unmap(store, key)

1364

self._key = None

1365

search_key = self._search_key(key)

1366

if len(unmapped) == 0:

1367

# All child nodes are gone, remove the child:

1368

del self._items[search_key]

1369

unmapped = None

1370

else:

1371

# Stash the returned node

1372

self._items[search_key] = unmapped

1373

if len(self._items) == 1:

1374

# this node is no longer needed:

1375

return self._items.values()[0]

1376

if type(unmapped) is InternalNode:

1377

return self

1378

if check_remap:

1379

return self._check_remap(store)

1380

else:

1381

return self

1382

1383

def _check_remap(self, store):

1384

"""Check if all keys contained by children fit in a single LeafNode.

1385

1386

:param store: A store to use for reading more nodes

1387

:return: Either self, or a new LeafNode which should replace self.

1388

"""

1389

# Logic for how we determine when we need to rebuild

1390

# 1) Implicitly unmap() is removing a key which means that the child

1391

# nodes are going to be shrinking by some extent.

1392

# 2) If all children are LeafNodes, it is possible that they could be

1393

# combined into a single LeafNode, which can then completely replace

1394

# this internal node with a single LeafNode

1395

# 3) If *one* child is an InternalNode, we assume it has already done

1396

# all the work to determine that its children cannot collapse, and

1397

# we can then assume that those nodes *plus* the current nodes don't

1398

# have a chance of collapsing either.

1399

# So a very cheap check is to just say if 'unmapped' is an

1400

# InternalNode, we don't have to check further.

1401

1402

# TODO: Another alternative is to check the total size of all known

1403

# LeafNodes. If there is some formula we can use to determine the

1404

# final size without actually having to read in any more

1405

# children, it would be nice to have. However, we have to be

1406

# careful with stuff like nodes that pull out the common prefix

1407

# of each key, as adding a new key can change the common prefix

1408

# and cause size changes greater than the length of one key.

1409

# So for now, we just add everything to a new Leaf until it

1410

# splits, as we know that will give the right answer

1411

new_leaf = LeafNode(search_key_func=self._search_key_func)

1412

new_leaf.set_maximum_size(self._maximum_size)

1413

new_leaf._key_width = self._key_width

1414

# A batch_size of 16 was chosen because:

1415

# a) In testing, a 4k page held 14 times. So if we have more than 16

1416

# leaf nodes we are unlikely to hold them in a single new leaf

1417

# node. This still allows for 1 round trip

1418

# b) With 16-way fan out, we can still do a single round trip

1419

# c) With 255-way fan out, we don't want to read all 255 and destroy

1420

# the page cache, just to determine that we really don't need it.

1421

for node, _ in self._iter_nodes(store, batch_size=16):

1422

if type(node) is InternalNode:

1423

# Without looking at any leaf nodes, we are sure

1424

return self

1425

for key, value in node._items.iteritems():

1426

if new_leaf._map_no_split(key, value):

1427

return self

1428

trace.mutter("remap generated a new LeafNode")

1429

return new_leaf

1430

1431

1432

def _deserialise(bytes, key, search_key_func):

1433

"""Helper for repositorydetails - convert bytes to a node."""

1434

if bytes.startswith("chkleaf:\n"):

1435

node = LeafNode.deserialise(bytes, key, search_key_func=search_key_func)

1436

elif bytes.startswith("chknode:\n"):

1437

node = InternalNode.deserialise(bytes, key,

1438

search_key_func=search_key_func)

1439

else:

1440

raise AssertionError("Unknown node type.")

1441

return node

1442

1443

1444

class CHKMapDifference(object):

1445

"""Iterate the stored pages and key,value pairs for (new - old).

1446

1447

This class provides a generator over the stored CHK pages and the

1448

(key, value) pairs that are in any of the new maps and not in any of the

1449

old maps.

1450

1451

Note that it may yield chk pages that are common (especially root nodes),

1452

but it won't yield (key,value) pairs that are common.

1453

"""

1454

1455

def __init__(self, store, new_root_keys, old_root_keys,

1456

search_key_func, pb=None):

1457

# TODO: Should we add a StaticTuple barrier here? It would be nice to

1458

# force callers to use StaticTuple, because there will often be

1459

# lots of keys passed in here. And even if we cast it locally,

1460

# that just meanst that we will have *both* a StaticTuple and a

1461

# tuple() in memory, referring to the same object. (so a net

1462

# increase in memory, not a decrease.)

1463

self._store = store

1464

self._new_root_keys = new_root_keys

1465

self._old_root_keys = old_root_keys

1466

self._pb = pb

1467

# All uninteresting chks that we have seen. By the time they are added

1468

# here, they should be either fully ignored, or queued up for

1469

# processing

1470

self._all_old_chks = set(self._old_root_keys)

1471

# All items that we have seen from the old_root_keys

1472

self._all_old_items = set()

1473

# These are interesting items which were either read, or already in the

1474

# interesting queue (so we don't need to walk them again)

1475

self._processed_new_refs = set()

1476

self._search_key_func = search_key_func

1477

1478

# The uninteresting and interesting nodes to be searched

1479

self._old_queue = []

1480

self._new_queue = []

1481

# Holds the (key, value) items found when processing the root nodes,

1482

# waiting for the uninteresting nodes to be walked

1483

self._new_item_queue = []

1484

self._state = None

1485

1486

def _read_nodes_from_store(self, keys):

1487

# We chose not to use _page_cache, because we think in terms of records

1488

# to be yielded. Also, we expect to touch each page only 1 time during

1489

# this code. (We may want to evaluate saving the raw bytes into the

1490

# page cache, which would allow a working tree update after the fetch

1491

# to not have to read the bytes again.)

1492

stream = self._store.get_record_stream(keys, 'unordered', True)

1493

for record in stream:

1494

if self._pb is not None:

1495

self._pb.tick()

1496

if record.storage_kind == 'absent':

1497

raise errors.NoSuchRevision(self._store, record.key)

1498

bytes = record.get_bytes_as('fulltext')

1499

node = _deserialise(bytes, record.key,

1500

search_key_func=self._search_key_func)

1501

if type(node) is InternalNode:

1502

# Note we don't have to do node.refs() because we know that

1503

# there are no children that have been pushed into this node

1504

# TODO: Turn these into StaticTuple, and possibly intern them.

1505

# The sha1 pointer (in this case the value), should

1506

# already be a static tuple, and properly interned. So

1507

# i'm not sure if there is a big win on top of that

1508

prefix_refs = node._items.items()

1509

items = []

1510

else:

1511

prefix_refs = []

1512

# TODO: Turn these into StaticTuple, and possibly intern them.

1513

# This points (ST(file_id), value), which in reality

1514

# should be pretty common, because of all the leaf nodes

1515

# that share most of the entries. Note, though, that we

1516

# didn't find a benefit to interning the value, so there

1517

# may not be an actual benefit to interning this tuple.

1518

# The file_key should already be interned. If it isn't we

1519

# need to look into it.

1520

items = node._items.items()

1521

yield record, node, prefix_refs, items

1522

1523

def _read_old_roots(self):

1524

old_chks_to_enqueue = []

1525

all_old_chks = self._all_old_chks

1526

for record, node, prefix_refs, items in \

1527

self._read_nodes_from_store(self._old_root_keys):

1528

# Uninteresting node

1529

prefix_refs = [p_r for p_r in prefix_refs

1530

if p_r[1] not in all_old_chks]

1531

new_refs = [p_r[1] for p_r in prefix_refs]

1532

all_old_chks.update(new_refs)

1533

self._all_old_items.update(items)

1534

# Queue up the uninteresting references

1535

# Don't actually put them in the 'to-read' queue until we have

1536

# finished checking the interesting references

1537

old_chks_to_enqueue.extend(prefix_refs)

1538

return old_chks_to_enqueue

1539

1540

def _enqueue_old(self, new_prefixes, old_chks_to_enqueue):

1541

# At this point, we have read all the uninteresting and interesting

1542

# items, so we can queue up the uninteresting stuff, knowing that we've

1543

# handled the interesting ones

1544

for prefix, ref in old_chks_to_enqueue:

1545

not_interesting = True

1546

for i in xrange(len(prefix), 0, -1):

1547

if prefix[:i] in new_prefixes:

1548

not_interesting = False

1549

break

1550

if not_interesting:

1551

# This prefix is not part of the remaining 'interesting set'

1552

continue

1553

self._old_queue.append(ref)

1554

1555

def _read_all_roots(self):

1556

"""Read the root pages.

1557

1558

This is structured as a generator, so that the root records can be

1559

yielded up to whoever needs them without any buffering.

1560

"""

1561

# This is the bootstrap phase

1562

if not self._old_root_keys:

1563

# With no old_root_keys we can just shortcut and be ready

1564

# for _flush_new_queue

1565

self._new_queue = list(self._new_root_keys)

1566

return

1567

old_chks_to_enqueue = self._read_old_roots()

1568

# filter out any root keys that are already known to be uninteresting

1569

new_keys = set(self._new_root_keys).difference(self._all_old_chks)

1570

# These are prefixes that are present in new_keys that we are

1571

# thinking to yield

1572

new_prefixes = set()

1573

# We are about to yield all of these, so we don't want them getting

1574

# added a second time

1575

processed_new_refs = self._processed_new_refs

1576

processed_new_refs.update(new_keys)

1577

for record, node, prefix_refs, items in \

1578

self._read_nodes_from_store(new_keys):

1579

# At this level, we now know all the uninteresting references

1580

# So we filter and queue up whatever is remaining

1581

prefix_refs = [p_r for p_r in prefix_refs

1582

if p_r[1] not in self._all_old_chks

1583

and p_r[1] not in processed_new_refs]

1584

refs = [p_r[1] for p_r in prefix_refs]

1585

new_prefixes.update([p_r[0] for p_r in prefix_refs])

1586

self._new_queue.extend(refs)

1587

# TODO: We can potentially get multiple items here, however the

1588

# current design allows for this, as callers will do the work

1589

# to make the results unique. We might profile whether we

1590

# gain anything by ensuring unique return values for items

1591

new_items = [item for item in items

1592

if item not in self._all_old_items]

1593

self._new_item_queue.extend(new_items)

1594

new_prefixes.update([self._search_key_func(item[0])

1595

for item in new_items])

1596

processed_new_refs.update(refs)

1597

yield record

1598

# For new_prefixes we have the full length prefixes queued up.

1599

# However, we also need possible prefixes. (If we have a known ref to

1600

# 'ab', then we also need to include 'a'.) So expand the

1601

# new_prefixes to include all shorter prefixes

1602

for prefix in list(new_prefixes):

1603

new_prefixes.update([prefix[:i] for i in xrange(1, len(prefix))])

1604

self._enqueue_old(new_prefixes, old_chks_to_enqueue)

1605

1606

def _flush_new_queue(self):

1607

# No need to maintain the heap invariant anymore, just pull things out

1608

# and process them

1609

refs = set(self._new_queue)

1610

self._new_queue = []

1611

# First pass, flush all interesting items and convert to using direct refs

1612

all_old_chks = self._all_old_chks

1613

processed_new_refs = self._processed_new_refs

1614

all_old_items = self._all_old_items

1615

new_items = [item for item in self._new_item_queue

1616

if item not in all_old_items]

1617

self._new_item_queue = []

1618

if new_items:

1619

yield None, new_items

1620

refs = refs.difference(all_old_chks)

1621

while refs:

1622

next_refs = set()

1623

next_refs_update = next_refs.update

1624

# Inlining _read_nodes_from_store improves 'bzr branch bzr.dev'

1625

# from 1m54s to 1m51s. Consider it.

1626

for record, _, p_refs, items in self._read_nodes_from_store(refs):

1627

items = [item for item in items

1628

if item not in all_old_items]

1629

yield record, items

1630

next_refs_update([p_r[1] for p_r in p_refs])

1631

next_refs = next_refs.difference(all_old_chks)

1632

next_refs = next_refs.difference(processed_new_refs)

1633

processed_new_refs.update(next_refs)

1634

refs = next_refs

1635

1636

def _process_next_old(self):

1637

# Since we don't filter uninteresting any further than during

1638

# _read_all_roots, process the whole queue in a single pass.

1639

refs = self._old_queue

1640

self._old_queue = []

1641

all_old_chks = self._all_old_chks

1642

for record, _, prefix_refs, items in self._read_nodes_from_store(refs):

1643

self._all_old_items.update(items)

1644

refs = [r for _,r in prefix_refs if r not in all_old_chks]

1645

self._old_queue.extend(refs)

1646

all_old_chks.update(refs)

1647

1648

def _process_queues(self):

1649

while self._old_queue:

1650

self._process_next_old()

1651

return self._flush_new_queue()

1652

1653

def process(self):

1654

for record in self._read_all_roots():

1655

yield record, []

1656

for record, items in self._process_queues():

1657

yield record, items

1658

1659

1660

def iter_interesting_nodes(store, interesting_root_keys,

1661

uninteresting_root_keys, pb=None):

1662

"""Given root keys, find interesting nodes.

1663

1664

Evaluate nodes referenced by interesting_root_keys. Ones that are also

1665

referenced from uninteresting_root_keys are not considered interesting.

1666

1667

:param interesting_root_keys: keys which should be part of the

1668

"interesting" nodes (which will be yielded)

1669

:param uninteresting_root_keys: keys which should be filtered out of the

1670

result set.

1671

:return: Yield

1672

(interesting record, {interesting key:values})

1673

"""

1674

iterator = CHKMapDifference(store, interesting_root_keys,

1675

uninteresting_root_keys,

1676

search_key_func=store._search_key_func,

1677

pb=pb)

1678

return iterator.process()

1679

1680

1681

try:

1682

from bzrlib._chk_map_pyx import (

1683

_search_key_16,

1684

_search_key_255,

1685

_deserialise_leaf_node,

1686

_deserialise_internal_node,

1687

)

1688

except ImportError, e:

1689

osutils.failed_to_load_extension(e)

1690

from bzrlib._chk_map_py import (

1691

_search_key_16,

1692

_search_key_255,

1693

_deserialise_leaf_node,

1694

_deserialise_internal_node,

1695

)

1696

search_key_registry.register('hash-16-way', _search_key_16)

1697

search_key_registry.register('hash-255-way', _search_key_255)

1698

1699

1700

def _check_key(key):

1701

"""Helper function to assert that a key is properly formatted.

1702

1703

This generally shouldn't be used in production code, but it can be helpful

1704

to debug problems.

1705

"""

1706

if type(key) is not StaticTuple:

1707

raise TypeError('key %r is not StaticTuple but %s' % (key, type(key)))

1708

if len(key) != 1:

1709

raise ValueError('key %r should have length 1, not %d' % (key, len(key),))

1710

if type(key[0]) is not str:

1711

raise TypeError('key %r should hold a str, not %r'

1712

% (key, type(key[0])))

1713

if not key[0].startswith('sha1:'):

1714

raise ValueError('key %r should point to a sha1:' % (key,))

1715

1716

Older »