/brz/remove-bazaar : revision 4757

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/btree_index.py

Committer: Canonical.com Patch Queue Manager
Date: 2009-10-19 10:59:16 UTC
mfrom: (4585.1.10 foreign-tests)
Revision ID: pqm@pqm.ubuntu.com-20091019105916-6z2jo34eqr6s0008

(Jelmer) Add infrastructure for testing foreign branch
implementations.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_import_c_api.h

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/doc_generate/sphinx_conf.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/static_tuple.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_foreign_vcs

bzrlib/tests/per_foreign_vcs/__init__.py

bzrlib/tests/per_foreign_vcs/test_branch.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_uifactory

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/script.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_script.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/pathfilter.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/Bazaar-Logo-For-Manuals.png

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/conf.py

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/implementation-notes.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index-plain.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/miscellaneous-notes.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/process.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/specifications.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_static/en/Makefile

doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/_static/en/bzr-en-quick-reference.png

doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/Makefile

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/index.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/index.txt

doc/es/user-guide

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/news-template.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/convertfile.py

tools/convertinv.py

tools/generate_docs.py

tools/generate_release_notes.py

tools/history2revfiles.py

tools/http_client.py

tools/package_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-control.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/btree_index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""B+Tree indices"""

import cStringIO

from bisect import bisect_right

import math

import tempfile

import zlib

from bzrlib import (

chunk_writer,

debug,

errors,

fifo_cache,

index,

lru_cache,

osutils,

trace,

)

from bzrlib.index import _OPTION_NODE_REFS, _OPTION_KEY_ELEMENTS, _OPTION_LEN

from bzrlib.transport import get_transport

_BTSIGNATURE = "B+Tree Graph Index 2\n"

_OPTION_ROW_LENGTHS = "row_lengths="

_LEAF_FLAG = "type=leaf\n"

_INTERNAL_FLAG = "type=internal\n"

_INTERNAL_OFFSET = "offset="

_RESERVED_HEADER_BYTES = 120

_PAGE_SIZE = 4096

# 4K per page: 4MB - 1000 entries

_NODE_CACHE_SIZE = 1000

class _BuilderRow(object):

"""The stored state accumulated while writing out a row in the index.

:ivar spool: A temporary file used to accumulate nodes for this row

in the tree.

:ivar nodes: The count of nodes emitted so far.

"""

def __init__(self):

"""Create a _BuilderRow."""

self.nodes = 0

self.spool = None# tempfile.TemporaryFile(prefix='bzr-index-row-')

self.writer = None

def finish_node(self, pad=True):

byte_lines, _, padding = self.writer.finish()

if self.nodes == 0:

self.spool = cStringIO.StringIO()

# padded note:

self.spool.write("\x00" * _RESERVED_HEADER_BYTES)

elif self.nodes == 1:

# We got bigger than 1 node, switch to a temp file

spool = tempfile.TemporaryFile(prefix='bzr-index-row-')

spool.write(self.spool.getvalue())

self.spool = spool

skipped_bytes = 0

if not pad and padding:

del byte_lines[-1]

skipped_bytes = padding

self.spool.writelines(byte_lines)

remainder = (self.spool.tell() + skipped_bytes) % _PAGE_SIZE

if remainder != 0:

raise AssertionError("incorrect node length: %d, %d"

% (self.spool.tell(), remainder))

self.nodes += 1

self.writer = None

class _InternalBuilderRow(_BuilderRow):

"""The stored state accumulated while writing out internal rows."""

def finish_node(self, pad=True):

if not pad:

raise AssertionError("Must pad internal nodes only.")

_BuilderRow.finish_node(self)

100

class _LeafBuilderRow(_BuilderRow):

101

"""The stored state accumulated while writing out a leaf rows."""

102

103

104

class BTreeBuilder(index.GraphIndexBuilder):

105

"""A Builder for B+Tree based Graph indices.

106

107

The resulting graph has the structure:

108

109

_SIGNATURE OPTIONS NODES

110

_SIGNATURE := 'B+Tree Graph Index 1' NEWLINE

111

OPTIONS := REF_LISTS KEY_ELEMENTS LENGTH

112

REF_LISTS := 'node_ref_lists=' DIGITS NEWLINE

113

KEY_ELEMENTS := 'key_elements=' DIGITS NEWLINE

114

LENGTH := 'len=' DIGITS NEWLINE

115

ROW_LENGTHS := 'row_lengths' DIGITS (COMMA DIGITS)*

116

NODES := NODE_COMPRESSED*

117

NODE_COMPRESSED:= COMPRESSED_BYTES{4096}

118

NODE_RAW := INTERNAL | LEAF

119

INTERNAL := INTERNAL_FLAG POINTERS

120

LEAF := LEAF_FLAG ROWS

121

KEY_ELEMENT := Not-whitespace-utf8

122

KEY := KEY_ELEMENT (NULL KEY_ELEMENT)*

123

ROWS := ROW*

124

ROW := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

125

ABSENT := 'a'

126

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

127

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

128

REFERENCE := KEY

129

VALUE := no-newline-no-null-bytes

130

"""

131

132

def __init__(self, reference_lists=0, key_elements=1, spill_at=100000):

133

"""See GraphIndexBuilder.__init__.

134

135

:param spill_at: Optional parameter controlling the maximum number

136

of nodes that BTreeBuilder will hold in memory.

137

"""

138

index.GraphIndexBuilder.__init__(self, reference_lists=reference_lists,

139

key_elements=key_elements)

140

self._spill_at = spill_at

141

self._backing_indices = []

142

# A map of {key: (node_refs, value)}

143

self._nodes = {}

144

# Indicate it hasn't been built yet

145

self._nodes_by_key = None

146

self._optimize_for_size = False

147

148

def add_node(self, key, value, references=()):

149

"""Add a node to the index.

150

151

If adding the node causes the builder to reach its spill_at threshold,

152

disk spilling will be triggered.

153

154

:param key: The key. keys are non-empty tuples containing

155

as many whitespace-free utf8 bytestrings as the key length

156

defined for this index.

157

:param references: An iterable of iterables of keys. Each is a

158

reference to another key.

159

:param value: The value to associate with the key. It may be any

160

bytes as long as it does not contain \0 or \n.

161

"""

162

# we don't care about absent_references

163

node_refs, _ = self._check_key_ref_value(key, references, value)

164

if key in self._nodes:

165

raise errors.BadIndexDuplicateKey(key, self)

166

# TODO: StaticTuple

167

self._nodes[key] = (node_refs, value)

168

self._keys.add(key)

169

if self._nodes_by_key is not None and self._key_length > 1:

170

self._update_nodes_by_key(key, value, node_refs)

171

if len(self._keys) < self._spill_at:

172

return

173

self._spill_mem_keys_to_disk()

174

175

def _spill_mem_keys_to_disk(self):

176

"""Write the in memory keys down to disk to cap memory consumption.

177

178

If we already have some keys written to disk, we will combine them so

179

as to preserve the sorted order. The algorithm for combining uses

180

powers of two. So on the first spill, write all mem nodes into a

181

single index. On the second spill, combine the mem nodes with the nodes

182

on disk to create a 2x sized disk index and get rid of the first index.

183

On the third spill, create a single new disk index, which will contain

184

the mem nodes, and preserve the existing 2x sized index. On the fourth,

185

combine mem with the first and second indexes, creating a new one of

186

size 4x. On the fifth create a single new one, etc.

187

"""

188

if self._combine_backing_indices:

189

(new_backing_file, size,

190

backing_pos) = self._spill_mem_keys_and_combine()

191

else:

192

new_backing_file, size = self._spill_mem_keys_without_combining()

193

# Note: The transport here isn't strictly needed, because we will use

194

# direct access to the new_backing._file object

195

new_backing = BTreeGraphIndex(get_transport('.'), '<temp>', size)

196

# GC will clean up the file

197

new_backing._file = new_backing_file

198

if self._combine_backing_indices:

199

if len(self._backing_indices) == backing_pos:

200

self._backing_indices.append(None)

201

self._backing_indices[backing_pos] = new_backing

202

for backing_pos in range(backing_pos):

203

self._backing_indices[backing_pos] = None

204

else:

205

self._backing_indices.append(new_backing)

206

self._keys = set()

207

self._nodes = {}

208

self._nodes_by_key = None

209

210

def _spill_mem_keys_without_combining(self):

211

return self._write_nodes(self._iter_mem_nodes(), allow_optimize=False)

212

213

def _spill_mem_keys_and_combine(self):

214

iterators_to_combine = [self._iter_mem_nodes()]

215

pos = -1

216

for pos, backing in enumerate(self._backing_indices):

217

if backing is None:

218

pos -= 1

219

break

220

iterators_to_combine.append(backing.iter_all_entries())

221

backing_pos = pos + 1

222

new_backing_file, size = \

223

self._write_nodes(self._iter_smallest(iterators_to_combine),

224

allow_optimize=False)

225

return new_backing_file, size, backing_pos

226

227

def add_nodes(self, nodes):

228

"""Add nodes to the index.

229

230

:param nodes: An iterable of (key, node_refs, value) entries to add.

231

"""

232

if self.reference_lists:

233

for (key, value, node_refs) in nodes:

234

self.add_node(key, value, node_refs)

235

else:

236

for (key, value) in nodes:

237

self.add_node(key, value)

238

239

def _iter_mem_nodes(self):

240

"""Iterate over the nodes held in memory."""

241

nodes = self._nodes

242

if self.reference_lists:

243

for key in sorted(nodes):

244

references, value = nodes[key]

245

yield self, key, value, references

246

else:

247

for key in sorted(nodes):

248

references, value = nodes[key]

249

yield self, key, value

250

251

def _iter_smallest(self, iterators_to_combine):

252

if len(iterators_to_combine) == 1:

253

for value in iterators_to_combine[0]:

254

yield value

255

return

256

current_values = []

257

for iterator in iterators_to_combine:

258

try:

259

current_values.append(iterator.next())

260

except StopIteration:

261

current_values.append(None)

262

last = None

263

while True:

264

# Decorate candidates with the value to allow 2.4's min to be used.

265

candidates = [(item[1][1], item) for item

266

in enumerate(current_values) if item[1] is not None]

267

if not len(candidates):

268

return

269

selected = min(candidates)

270

# undecorate back to (pos, node)

271

selected = selected[1]

272

if last == selected[1][1]:

273

raise errors.BadIndexDuplicateKey(last, self)

274

last = selected[1][1]

275

# Yield, with self as the index

276

yield (self,) + selected[1][1:]

277

pos = selected[0]

278

try:

279

current_values[pos] = iterators_to_combine[pos].next()

280

except StopIteration:

281

current_values[pos] = None

282

283

def _add_key(self, string_key, line, rows, allow_optimize=True):

284

"""Add a key to the current chunk.

285

286

:param string_key: The key to add.

287

:param line: The fully serialised key and value.

288

:param allow_optimize: If set to False, prevent setting the optimize

289

flag when writing out. This is used by the _spill_mem_keys_to_disk

290

functionality.

291

"""

292

if rows[-1].writer is None:

293

# opening a new leaf chunk;

294

for pos, internal_row in enumerate(rows[:-1]):

295

# flesh out any internal nodes that are needed to

296

# preserve the height of the tree

297

if internal_row.writer is None:

298

length = _PAGE_SIZE

299

if internal_row.nodes == 0:

300

length -= _RESERVED_HEADER_BYTES # padded

301

if allow_optimize:

302

optimize_for_size = self._optimize_for_size

303

else:

304

optimize_for_size = False

305

internal_row.writer = chunk_writer.ChunkWriter(length, 0,

306

optimize_for_size=optimize_for_size)

307

internal_row.writer.write(_INTERNAL_FLAG)

308

internal_row.writer.write(_INTERNAL_OFFSET +

309

str(rows[pos + 1].nodes) + "\n")

310

# add a new leaf

311

length = _PAGE_SIZE

312

if rows[-1].nodes == 0:

313

length -= _RESERVED_HEADER_BYTES # padded

314

rows[-1].writer = chunk_writer.ChunkWriter(length,

315

optimize_for_size=self._optimize_for_size)

316

rows[-1].writer.write(_LEAF_FLAG)

317

if rows[-1].writer.write(line):

318

# this key did not fit in the node:

319

rows[-1].finish_node()

320

key_line = string_key + "\n"

321

new_row = True

322

for row in reversed(rows[:-1]):

323

# Mark the start of the next node in the node above. If it

324

# doesn't fit then propagate upwards until we find one that

325

# it does fit into.

326

if row.writer.write(key_line):

327

row.finish_node()

328

else:

329

# We've found a node that can handle the pointer.

330

new_row = False

331

break

332

# If we reached the current root without being able to mark the

333

# division point, then we need a new root:

334

if new_row:

335

# We need a new row

336

if 'index' in debug.debug_flags:

337

trace.mutter('Inserting new global row.')

338

new_row = _InternalBuilderRow()

339

reserved_bytes = 0

340

rows.insert(0, new_row)

341

# This will be padded, hence the -100

342

new_row.writer = chunk_writer.ChunkWriter(

343

_PAGE_SIZE - _RESERVED_HEADER_BYTES,

344

reserved_bytes,

345

optimize_for_size=self._optimize_for_size)

346

new_row.writer.write(_INTERNAL_FLAG)

347

new_row.writer.write(_INTERNAL_OFFSET +

348

str(rows[1].nodes - 1) + "\n")

349

new_row.writer.write(key_line)

350

self._add_key(string_key, line, rows, allow_optimize=allow_optimize)

351

352

def _write_nodes(self, node_iterator, allow_optimize=True):

353

"""Write node_iterator out as a B+Tree.

354

355

:param node_iterator: An iterator of sorted nodes. Each node should

356

match the output given by iter_all_entries.

357

:param allow_optimize: If set to False, prevent setting the optimize

358

flag when writing out. This is used by the _spill_mem_keys_to_disk

359

functionality.

360

:return: A file handle for a temporary file containing a B+Tree for

361

the nodes.

362

"""

363

# The index rows - rows[0] is the root, rows[1] is the layer under it

364

# etc.

365

rows = []

366

# forward sorted by key. In future we may consider topological sorting,

367

# at the cost of table scans for direct lookup, or a second index for

368

# direct lookup

369

key_count = 0

370

# A stack with the number of nodes of each size. 0 is the root node

371

# and must always be 1 (if there are any nodes in the tree).

372

self.row_lengths = []

373

# Loop over all nodes adding them to the bottom row

374

# (rows[-1]). When we finish a chunk in a row,

375

# propagate the key that didn't fit (comes after the chunk) to the

376

# row above, transitively.

377

for node in node_iterator:

378

if key_count == 0:

379

# First key triggers the first row

380

rows.append(_LeafBuilderRow())

381

key_count += 1

382

string_key, line = _btree_serializer._flatten_node(node,

383

self.reference_lists)

384

self._add_key(string_key, line, rows, allow_optimize=allow_optimize)

385

for row in reversed(rows):

386

pad = (type(row) != _LeafBuilderRow)

387

row.finish_node(pad=pad)

388

lines = [_BTSIGNATURE]

389

lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')

390

lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')

391

lines.append(_OPTION_LEN + str(key_count) + '\n')

392

row_lengths = [row.nodes for row in rows]

393

lines.append(_OPTION_ROW_LENGTHS + ','.join(map(str, row_lengths)) + '\n')

394

if row_lengths and row_lengths[-1] > 1:

395

result = tempfile.NamedTemporaryFile(prefix='bzr-index-')

396

else:

397

result = cStringIO.StringIO()

398

result.writelines(lines)

399

position = sum(map(len, lines))

400

root_row = True

401

if position > _RESERVED_HEADER_BYTES:

402

raise AssertionError("Could not fit the header in the"

403

" reserved space: %d > %d"

404

% (position, _RESERVED_HEADER_BYTES))

405

# write the rows out:

406

for row in rows:

407

reserved = _RESERVED_HEADER_BYTES # reserved space for first node

408

row.spool.flush()

409

row.spool.seek(0)

410

# copy nodes to the finalised file.

411

# Special case the first node as it may be prefixed

412

node = row.spool.read(_PAGE_SIZE)

413

result.write(node[reserved:])

414

result.write("\x00" * (reserved - position))

415

position = 0 # Only the root row actually has an offset

416

copied_len = osutils.pumpfile(row.spool, result)

417

if copied_len != (row.nodes - 1) * _PAGE_SIZE:

418

if type(row) != _LeafBuilderRow:

419

raise AssertionError("Incorrect amount of data copied"

420

" expected: %d, got: %d"

421

% ((row.nodes - 1) * _PAGE_SIZE,

422

copied_len))

423

result.flush()

424

size = result.tell()

425

result.seek(0)

426

return result, size

427

428

def finish(self):

429

"""Finalise the index.

430

431

:return: A file handle for a temporary file containing the nodes added

432

to the index.

433

"""

434

return self._write_nodes(self.iter_all_entries())[0]

435

436

def iter_all_entries(self):

437

"""Iterate over all keys within the index

438

439

:return: An iterable of (index, key, value, reference_lists). There is

440

no defined order for the result iteration - it will be in the most

441

efficient order for the index (in this case dictionary hash order).

442

"""

443

if 'evil' in debug.debug_flags:

444

trace.mutter_callsite(3,

445

"iter_all_entries scales with size of history.")

446

# Doing serial rather than ordered would be faster; but this shouldn't

447

# be getting called routinely anyway.

448

iterators = [self._iter_mem_nodes()]

449

for backing in self._backing_indices:

450

if backing is not None:

451

iterators.append(backing.iter_all_entries())

452

if len(iterators) == 1:

453

return iterators[0]

454

return self._iter_smallest(iterators)

455

456

def iter_entries(self, keys):

457

"""Iterate over keys within the index.

458

459

:param keys: An iterable providing the keys to be retrieved.

460

:return: An iterable of (index, key, value, reference_lists). There is no

461

defined order for the result iteration - it will be in the most

462

efficient order for the index (keys iteration order in this case).

463

"""

464

keys = set(keys)

465

local_keys = keys.intersection(self._keys)

466

if self.reference_lists:

467

for key in local_keys:

468

node = self._nodes[key]

469

yield self, key, node[1], node[0]

470

else:

471

for key in local_keys:

472

node = self._nodes[key]

473

yield self, key, node[1]

474

# Find things that are in backing indices that have not been handled

475

# yet.

476

if not self._backing_indices:

477

return # We won't find anything there either

478

# Remove all of the keys that we found locally

479

keys.difference_update(local_keys)

480

for backing in self._backing_indices:

481

if backing is None:

482

continue

483

if not keys:

484

return

485

for node in backing.iter_entries(keys):

486

keys.remove(node[1])

487

yield (self,) + node[1:]

488

489

def iter_entries_prefix(self, keys):

490

"""Iterate over keys within the index using prefix matching.

491

492

Prefix matching is applied within the tuple of a key, not to within

493

the bytestring of each key element. e.g. if you have the keys ('foo',

494

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

495

only the former key is returned.

496

497

:param keys: An iterable providing the key prefixes to be retrieved.

498

Each key prefix takes the form of a tuple the length of a key, but

499

with the last N elements 'None' rather than a regular bytestring.

500

The first element cannot be 'None'.

501

:return: An iterable as per iter_all_entries, but restricted to the

502

keys with a matching prefix to those supplied. No additional keys

503

will be returned, and every match that is in the index will be

504

returned.

505

"""

506

# XXX: To much duplication with the GraphIndex class; consider finding

507

# a good place to pull out the actual common logic.

508

keys = set(keys)

509

if not keys:

510

return

511

for backing in self._backing_indices:

512

if backing is None:

513

continue

514

for node in backing.iter_entries_prefix(keys):

515

yield (self,) + node[1:]

516

if self._key_length == 1:

517

for key in keys:

518

# sanity check

519

if key[0] is None:

520

raise errors.BadIndexKey(key)

521

if len(key) != self._key_length:

522

raise errors.BadIndexKey(key)

523

try:

524

node = self._nodes[key]

525

except KeyError:

526

continue

527

if self.reference_lists:

528

yield self, key, node[1], node[0]

529

else:

530

yield self, key, node[1]

531

return

532

for key in keys:

533

# sanity check

534

if key[0] is None:

535

raise errors.BadIndexKey(key)

536

if len(key) != self._key_length:

537

raise errors.BadIndexKey(key)

538

# find what it refers to:

539

key_dict = self._get_nodes_by_key()

540

elements = list(key)

541

# find the subdict to return

542

try:

543

while len(elements) and elements[0] is not None:

544

key_dict = key_dict[elements[0]]

545

elements.pop(0)

546

except KeyError:

547

# a non-existant lookup.

548

continue

549

if len(elements):

550

dicts = [key_dict]

551

while dicts:

552

key_dict = dicts.pop(-1)

553

# can't be empty or would not exist

554

item, value = key_dict.iteritems().next()

555

if type(value) == dict:

556

# push keys

557

dicts.extend(key_dict.itervalues())

558

else:

559

# yield keys

560

for value in key_dict.itervalues():

561

yield (self, ) + value

562

else:

563

yield (self, ) + key_dict

564

565

def _get_nodes_by_key(self):

566

if self._nodes_by_key is None:

567

nodes_by_key = {}

568

if self.reference_lists:

569

for key, (references, value) in self._nodes.iteritems():

570

key_dict = nodes_by_key

571

for subkey in key[:-1]:

572

key_dict = key_dict.setdefault(subkey, {})

573

key_dict[key[-1]] = key, value, references

574

else:

575

for key, (references, value) in self._nodes.iteritems():

576

key_dict = nodes_by_key

577

for subkey in key[:-1]:

578

key_dict = key_dict.setdefault(subkey, {})

579

key_dict[key[-1]] = key, value

580

self._nodes_by_key = nodes_by_key

581

return self._nodes_by_key

582

583

def key_count(self):

584

"""Return an estimate of the number of keys in this index.

585

586

For InMemoryGraphIndex the estimate is exact.

587

"""

588

return len(self._keys) + sum(backing.key_count() for backing in

589

self._backing_indices if backing is not None)

590

591

def validate(self):

592

"""In memory index's have no known corruption at the moment."""

593

594

595

class _LeafNode(object):

596

"""A leaf node for a serialised B+Tree index."""

597

598

__slots__ = ('keys', 'min_key', 'max_key')

599

600

def __init__(self, bytes, key_length, ref_list_length):

601

"""Parse bytes to create a leaf node object."""

602

# splitlines mangles the \r delimiters.. don't use it.

603

key_list = _btree_serializer._parse_leaf_lines(bytes,

604

key_length, ref_list_length)

605

if key_list:

606

self.min_key = key_list[0][0]

607

self.max_key = key_list[-1][0]

608

else:

609

self.min_key = self.max_key = None

610

self.keys = dict(key_list)

611

612

613

class _InternalNode(object):

614

"""An internal node for a serialised B+Tree index."""

615

616

__slots__ = ('keys', 'offset')

617

618

def __init__(self, bytes):

619

"""Parse bytes to create an internal node object."""

620

# splitlines mangles the \r delimiters.. don't use it.

621

self.keys = self._parse_lines(bytes.split('\n'))

622

623

def _parse_lines(self, lines):

624

nodes = []

625

self.offset = int(lines[1][7:])

626

for line in lines[2:]:

627

if line == '':

628

break

629

# TODO: Switch to StaticTuple here.

630

nodes.append(tuple(map(intern, line.split('\0'))))

631

return nodes

632

633

634

class BTreeGraphIndex(object):

635

"""Access to nodes via the standard GraphIndex interface for B+Tree's.

636

637

Individual nodes are held in a LRU cache. This holds the root node in

638

memory except when very large walks are done.

639

"""

640

641

def __init__(self, transport, name, size, unlimited_cache=False):

642

"""Create a B+Tree index object on the index name.

643

644

:param transport: The transport to read data for the index from.

645

:param name: The file name of the index on transport.

646

:param size: Optional size of the index in bytes. This allows

647

compatibility with the GraphIndex API, as well as ensuring that

648

the initial read (to read the root node header) can be done

649

without over-reading even on empty indices, and on small indices

650

allows single-IO to read the entire index.

651

:param unlimited_cache: If set to True, then instead of using an

652

LRUCache with size _NODE_CACHE_SIZE, we will use a dict and always

653

cache all leaf nodes.

654

"""

655

self._transport = transport

656

self._name = name

657

self._size = size

658

self._file = None

659

self._recommended_pages = self._compute_recommended_pages()

660

self._root_node = None

661

# Default max size is 100,000 leave values

662

self._leaf_value_cache = None # lru_cache.LRUCache(100*1000)

663

if unlimited_cache:

664

self._leaf_node_cache = {}

665

self._internal_node_cache = {}

666

else:

667

self._leaf_node_cache = lru_cache.LRUCache(_NODE_CACHE_SIZE)

668

# We use a FIFO here just to prevent possible blowout. However, a

669

# 300k record btree has only 3k leaf nodes, and only 20 internal

670

# nodes. A value of 100 scales to ~100*100*100 = 1M records.

671

self._internal_node_cache = fifo_cache.FIFOCache(100)

672

self._key_count = None

673

self._row_lengths = None

674

self._row_offsets = None # Start of each row, [-1] is the end

675

676

def __eq__(self, other):

677

"""Equal when self and other were created with the same parameters."""

678

return (

679

type(self) == type(other) and

680

self._transport == other._transport and

681

self._name == other._name and

682

self._size == other._size)

683

684

def __ne__(self, other):

685

return not self.__eq__(other)

686

687

def _get_and_cache_nodes(self, nodes):

688

"""Read nodes and cache them in the lru.

689

690

The nodes list supplied is sorted and then read from disk, each node

691

being inserted it into the _node_cache.

692

693

Note: Asking for more nodes than the _node_cache can contain will

694

result in some of the results being immediately discarded, to prevent

695

this an assertion is raised if more nodes are asked for than are

696

cachable.

697

698

:return: A dict of {node_pos: node}

699

"""

700

found = {}

701

start_of_leaves = None

702

for node_pos, node in self._read_nodes(sorted(nodes)):

703

if node_pos == 0: # Special case

704

self._root_node = node

705

else:

706

if start_of_leaves is None:

707

start_of_leaves = self._row_offsets[-2]

708

if node_pos < start_of_leaves:

709

self._internal_node_cache[node_pos] = node

710

else:

711

self._leaf_node_cache[node_pos] = node

712

found[node_pos] = node

713

return found

714

715

def _compute_recommended_pages(self):

716

"""Convert transport's recommended_page_size into btree pages.

717

718

recommended_page_size is in bytes, we want to know how many _PAGE_SIZE

719

pages fit in that length.

720

"""

721

recommended_read = self._transport.recommended_page_size()

722

recommended_pages = int(math.ceil(recommended_read /

723

float(_PAGE_SIZE)))

724

return recommended_pages

725

726

def _compute_total_pages_in_index(self):

727

"""How many pages are in the index.

728

729

If we have read the header we will use the value stored there.

730

Otherwise it will be computed based on the length of the index.

731

"""

732

if self._size is None:

733

raise AssertionError('_compute_total_pages_in_index should not be'

734

' called when self._size is None')

735

if self._root_node is not None:

736

# This is the number of pages as defined by the header

737

return self._row_offsets[-1]

738

# This is the number of pages as defined by the size of the index. They

739

# should be indentical.

740

total_pages = int(math.ceil(self._size / float(_PAGE_SIZE)))

741

return total_pages

742

743

def _expand_offsets(self, offsets):

744

"""Find extra pages to download.

745

746

The idea is that we always want to make big-enough requests (like 64kB

747

for http), so that we don't waste round trips. So given the entries

748

that we already have cached and the new pages being downloaded figure

749

out what other pages we might want to read.

750

751

See also doc/developers/btree_index_prefetch.txt for more details.

752

753

:param offsets: The offsets to be read

754

:return: A list of offsets to download

755

"""

756

if 'index' in debug.debug_flags:

757

trace.mutter('expanding: %s\toffsets: %s', self._name, offsets)

758

759

if len(offsets) >= self._recommended_pages:

760

# Don't add more, we are already requesting more than enough

761

if 'index' in debug.debug_flags:

762

trace.mutter(' not expanding large request (%s >= %s)',

763

len(offsets), self._recommended_pages)

764

return offsets

765

if self._size is None:

766

# Don't try anything, because we don't know where the file ends

767

if 'index' in debug.debug_flags:

768

trace.mutter(' not expanding without knowing index size')

769

return offsets

770

total_pages = self._compute_total_pages_in_index()

771

cached_offsets = self._get_offsets_to_cached_pages()

772

# If reading recommended_pages would read the rest of the index, just

773

# do so.

774

if total_pages - len(cached_offsets) <= self._recommended_pages:

775

# Read whatever is left

776

if cached_offsets:

777

expanded = [x for x in xrange(total_pages)

778

if x not in cached_offsets]

779

else:

780

expanded = range(total_pages)

781

if 'index' in debug.debug_flags:

782

trace.mutter(' reading all unread pages: %s', expanded)

783

return expanded

784

785

if self._root_node is None:

786

# ATM on the first read of the root node of a large index, we don't

787

# bother pre-reading any other pages. This is because the

788

# likelyhood of actually reading interesting pages is very low.

789

# See doc/developers/btree_index_prefetch.txt for a discussion, and

790

# a possible implementation when we are guessing that the second

791

# layer index is small

792

final_offsets = offsets

793

else:

794

tree_depth = len(self._row_lengths)

795

if len(cached_offsets) < tree_depth and len(offsets) == 1:

796

# We haven't read enough to justify expansion

797

# If we are only going to read the root node, and 1 leaf node,

798

# then it isn't worth expanding our request. Once we've read at

799

# least 2 nodes, then we are probably doing a search, and we

800

# start expanding our requests.

801

if 'index' in debug.debug_flags:

802

trace.mutter(' not expanding on first reads')

803

return offsets

804

final_offsets = self._expand_to_neighbors(offsets, cached_offsets,

805

total_pages)

806

807

final_offsets = sorted(final_offsets)

808

if 'index' in debug.debug_flags:

809

trace.mutter('expanded: %s', final_offsets)

810

return final_offsets

811

812

def _expand_to_neighbors(self, offsets, cached_offsets, total_pages):

813

"""Expand requests to neighbors until we have enough pages.

814

815

This is called from _expand_offsets after policy has determined that we

816

want to expand.

817

We only want to expand requests within a given layer. We cheat a little

818

bit and assume all requests will be in the same layer. This is true

819

given the current design, but if it changes this algorithm may perform

820

oddly.

821

822

:param offsets: requested offsets

823

:param cached_offsets: offsets for pages we currently have cached

824

:return: A set() of offsets after expansion

825

"""

826

final_offsets = set(offsets)

827

first = end = None

828

new_tips = set(final_offsets)

829

while len(final_offsets) < self._recommended_pages and new_tips:

830

next_tips = set()

831

for pos in new_tips:

832

if first is None:

833

first, end = self._find_layer_first_and_end(pos)

834

previous = pos - 1

835

if (previous > 0

836

and previous not in cached_offsets

837

and previous not in final_offsets

838

and previous >= first):

839

next_tips.add(previous)

840

after = pos + 1

841

if (after < total_pages

842

and after not in cached_offsets

843

and after not in final_offsets

844

and after < end):

845

next_tips.add(after)

846

# This would keep us from going bigger than

847

# recommended_pages by only expanding the first offsets.

848

# However, if we are making a 'wide' request, it is

849

# reasonable to expand all points equally.

850

# if len(final_offsets) > recommended_pages:

851

# break

852

final_offsets.update(next_tips)

853

new_tips = next_tips

854

return final_offsets

855

856

def external_references(self, ref_list_num):

857

if self._root_node is None:

858

self._get_root_node()

859

if ref_list_num + 1 > self.node_ref_lists:

860

raise ValueError('No ref list %d, index has %d ref lists'

861

% (ref_list_num, self.node_ref_lists))

862

keys = set()

863

refs = set()

864

for node in self.iter_all_entries():

865

keys.add(node[1])

866

refs.update(node[3][ref_list_num])

867

return refs - keys

868

869

def _find_layer_first_and_end(self, offset):

870

"""Find the start/stop nodes for the layer corresponding to offset.

871

872

:return: (first, end)

873

first is the first node in this layer

874

end is the first node of the next layer

875

"""

876

first = end = 0

877

for roffset in self._row_offsets:

878

first = end

879

end = roffset

880

if offset < roffset:

881

break

882

return first, end

883

884

def _get_offsets_to_cached_pages(self):

885

"""Determine what nodes we already have cached."""

886

cached_offsets = set(self._internal_node_cache.keys())

887

cached_offsets.update(self._leaf_node_cache.keys())

888

if self._root_node is not None:

889

cached_offsets.add(0)

890

return cached_offsets

891

892

def _get_root_node(self):

893

if self._root_node is None:

894

# We may not have a root node yet

895

self._get_internal_nodes([0])

896

return self._root_node

897

898

def _get_nodes(self, cache, node_indexes):

899

found = {}

900

needed = []

901

for idx in node_indexes:

902

if idx == 0 and self._root_node is not None:

903

found[0] = self._root_node

904

continue

905

try:

906

found[idx] = cache[idx]

907

except KeyError:

908

needed.append(idx)

909

if not needed:

910

return found

911

needed = self._expand_offsets(needed)

912

found.update(self._get_and_cache_nodes(needed))

913

return found

914

915

def _get_internal_nodes(self, node_indexes):

916

"""Get a node, from cache or disk.

917

918

After getting it, the node will be cached.

919

"""

920

return self._get_nodes(self._internal_node_cache, node_indexes)

921

922

def _cache_leaf_values(self, nodes):

923

"""Cache directly from key => value, skipping the btree."""

924

if self._leaf_value_cache is not None:

925

for node in nodes.itervalues():

926

for key, value in node.keys.iteritems():

927

if key in self._leaf_value_cache:

928

# Don't add the rest of the keys, we've seen this node

929

# before.

930

break

931

self._leaf_value_cache[key] = value

932

933

def _get_leaf_nodes(self, node_indexes):

934

"""Get a bunch of nodes, from cache or disk."""

935

found = self._get_nodes(self._leaf_node_cache, node_indexes)

936

self._cache_leaf_values(found)

937

return found

938

939

def iter_all_entries(self):

940

"""Iterate over all keys within the index.

941

942

:return: An iterable of (index, key, value) or (index, key, value, reference_lists).

943

The former tuple is used when there are no reference lists in the

944

index, making the API compatible with simple key:value index types.

945

There is no defined order for the result iteration - it will be in

946

the most efficient order for the index.

947

"""

948

if 'evil' in debug.debug_flags:

949

trace.mutter_callsite(3,

950

"iter_all_entries scales with size of history.")

951

if not self.key_count():

952

return

953

if self._row_offsets[-1] == 1:

954

# There is only the root node, and we read that via key_count()

955

if self.node_ref_lists:

956

for key, (value, refs) in sorted(self._root_node.keys.items()):

957

yield (self, key, value, refs)

958

else:

959

for key, (value, refs) in sorted(self._root_node.keys.items()):

960

yield (self, key, value)

961

return

962

start_of_leaves = self._row_offsets[-2]

963

end_of_leaves = self._row_offsets[-1]

964

needed_offsets = range(start_of_leaves, end_of_leaves)

965

if needed_offsets == [0]:

966

# Special case when we only have a root node, as we have already

967

# read everything

968

nodes = [(0, self._root_node)]

969

else:

970

nodes = self._read_nodes(needed_offsets)

971

# We iterate strictly in-order so that we can use this function

972

# for spilling index builds to disk.

973

if self.node_ref_lists:

974

for _, node in nodes:

975

for key, (value, refs) in sorted(node.keys.items()):

976

yield (self, key, value, refs)

977

else:

978

for _, node in nodes:

979

for key, (value, refs) in sorted(node.keys.items()):

980

yield (self, key, value)

981

982

@staticmethod

983

def _multi_bisect_right(in_keys, fixed_keys):

984

"""Find the positions where each 'in_key' would fit in fixed_keys.

985

986

This is equivalent to doing "bisect_right" on each in_key into

987

fixed_keys

988

989

:param in_keys: A sorted list of keys to match with fixed_keys

990

:param fixed_keys: A sorted list of keys to match against

991

:return: A list of (integer position, [key list]) tuples.

992

"""

993

if not in_keys:

994

return []

995

if not fixed_keys:

996

# no pointers in the fixed_keys list, which means everything must

997

# fall to the left.

998

return [(0, in_keys)]

999

1000

# TODO: Iterating both lists will generally take M + N steps

1001

# Bisecting each key will generally take M * log2 N steps.

1002

# If we had an efficient way to compare, we could pick the method

1003

# based on which has the fewer number of steps.

1004

# There is also the argument that bisect_right is a compiled

1005

# function, so there is even more to be gained.

1006

# iter_steps = len(in_keys) + len(fixed_keys)

1007

# bisect_steps = len(in_keys) * math.log(len(fixed_keys), 2)

1008

if len(in_keys) == 1: # Bisect will always be faster for M = 1

1009

return [(bisect_right(fixed_keys, in_keys[0]), in_keys)]

1010

# elif bisect_steps < iter_steps:

1011

# offsets = {}

1012

# for key in in_keys:

1013

# offsets.setdefault(bisect_right(fixed_keys, key),

1014

# []).append(key)

1015

# return [(o, offsets[o]) for o in sorted(offsets)]

1016

in_keys_iter = iter(in_keys)

1017

fixed_keys_iter = enumerate(fixed_keys)

1018

cur_in_key = in_keys_iter.next()

1019

cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()

1020

1021

class InputDone(Exception): pass

1022

class FixedDone(Exception): pass

1023

1024

output = []

1025

cur_out = []

1026

1027

# TODO: Another possibility is that rather than iterating on each side,

1028

# we could use a combination of bisecting and iterating. For

1029

# example, while cur_in_key < fixed_key, bisect to find its

1030

# point, then iterate all matching keys, then bisect (restricted

1031

# to only the remainder) for the next one, etc.

1032

try:

1033

while True:

1034

if cur_in_key < cur_fixed_key:

1035

cur_keys = []

1036

cur_out = (cur_fixed_offset, cur_keys)

1037

output.append(cur_out)

1038

while cur_in_key < cur_fixed_key:

1039

cur_keys.append(cur_in_key)

1040

try:

1041

cur_in_key = in_keys_iter.next()

1042

except StopIteration:

1043

raise InputDone

1044

# At this point cur_in_key must be >= cur_fixed_key

1045

# step the cur_fixed_key until we pass the cur key, or walk off

1046

# the end

1047

while cur_in_key >= cur_fixed_key:

1048

try:

1049

cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()

1050

except StopIteration:

1051

raise FixedDone

1052

except InputDone:

1053

# We consumed all of the input, nothing more to do

1054

pass

1055

except FixedDone:

1056

# There was some input left, but we consumed all of fixed, so we

1057

# have to add one more for the tail

1058

cur_keys = [cur_in_key]

1059

cur_keys.extend(in_keys_iter)

1060

cur_out = (len(fixed_keys), cur_keys)

1061

output.append(cur_out)

1062

return output

1063

1064

def _walk_through_internal_nodes(self, keys):

1065

"""Take the given set of keys, and find the corresponding LeafNodes.

1066

1067

:param keys: An unsorted iterable of keys to search for

1068

:return: (nodes, index_and_keys)

1069

nodes is a dict mapping {index: LeafNode}

1070

keys_at_index is a list of tuples of [(index, [keys for Leaf])]

1071

"""

1072

# 6 seconds spent in miss_torture using the sorted() line.

1073

# Even with out of order disk IO it seems faster not to sort it when

1074

# large queries are being made.

1075

keys_at_index = [(0, sorted(keys))]

1076

1077

for row_pos, next_row_start in enumerate(self._row_offsets[1:-1]):

1078

node_indexes = [idx for idx, s_keys in keys_at_index]

1079

nodes = self._get_internal_nodes(node_indexes)

1080

1081

next_nodes_and_keys = []

1082

for node_index, sub_keys in keys_at_index:

1083

node = nodes[node_index]

1084

positions = self._multi_bisect_right(sub_keys, node.keys)

1085

node_offset = next_row_start + node.offset

1086

next_nodes_and_keys.extend([(node_offset + pos, s_keys)

1087

for pos, s_keys in positions])

1088

keys_at_index = next_nodes_and_keys

1089

# We should now be at the _LeafNodes

1090

node_indexes = [idx for idx, s_keys in keys_at_index]

1091

1092

# TODO: We may *not* want to always read all the nodes in one

1093

# big go. Consider setting a max size on this.

1094

nodes = self._get_leaf_nodes(node_indexes)

1095

return nodes, keys_at_index

1096

1097

def iter_entries(self, keys):

1098

"""Iterate over keys within the index.

1099

1100

:param keys: An iterable providing the keys to be retrieved.

1101

:return: An iterable as per iter_all_entries, but restricted to the

1102

keys supplied. No additional keys will be returned, and every

1103

key supplied that is in the index will be returned.

1104

"""

1105

# 6 seconds spent in miss_torture using the sorted() line.

1106

# Even with out of order disk IO it seems faster not to sort it when

1107

# large queries are being made.

1108

# However, now that we are doing multi-way bisecting, we need the keys

1109

# in sorted order anyway. We could change the multi-way code to not

1110

# require sorted order. (For example, it bisects for the first node,

1111

# does an in-order search until a key comes before the current point,

1112

# which it then bisects for, etc.)

1113

keys = frozenset(keys)

1114

if not keys:

1115

return

1116

1117

if not self.key_count():

1118

return

1119

1120

needed_keys = []

1121

if self._leaf_value_cache is None:

1122

needed_keys = keys

1123

else:

1124

for key in keys:

1125

value = self._leaf_value_cache.get(key, None)

1126

if value is not None:

1127

# This key is known not to be here, skip it

1128

value, refs = value

1129

if self.node_ref_lists:

1130

yield (self, key, value, refs)

1131

else:

1132

yield (self, key, value)

1133

else:

1134

needed_keys.append(key)

1135

1136

last_key = None

1137

needed_keys = keys

1138

if not needed_keys:

1139

return

1140

nodes, nodes_and_keys = self._walk_through_internal_nodes(needed_keys)

1141

for node_index, sub_keys in nodes_and_keys:

1142

if not sub_keys:

1143

continue

1144

node = nodes[node_index]

1145

for next_sub_key in sub_keys:

1146

if next_sub_key in node.keys:

1147

value, refs = node.keys[next_sub_key]

1148

if self.node_ref_lists:

1149

yield (self, next_sub_key, value, refs)

1150

else:

1151

yield (self, next_sub_key, value)

1152

1153

def _find_ancestors(self, keys, ref_list_num, parent_map, missing_keys):

1154

"""Find the parent_map information for the set of keys.

1155

1156

This populates the parent_map dict and missing_keys set based on the

1157

queried keys. It also can fill out an arbitrary number of parents that

1158

it finds while searching for the supplied keys.

1159

1160

It is unlikely that you want to call this directly. See

1161

"CombinedGraphIndex.find_ancestry()" for a more appropriate API.

1162

1163

:param keys: A keys whose ancestry we want to return

1164

Every key will either end up in 'parent_map' or 'missing_keys'.

1165

:param ref_list_num: This index in the ref_lists is the parents we

1166

care about.

1167

:param parent_map: {key: parent_keys} for keys that are present in this

1168

index. This may contain more entries than were in 'keys', that are

1169

reachable ancestors of the keys requested.

1170

:param missing_keys: keys which are known to be missing in this index.

1171

This may include parents that were not directly requested, but we

1172

were able to determine that they are not present in this index.

1173

:return: search_keys parents that were found but not queried to know

1174

if they are missing or present. Callers can re-query this index for

1175

those keys, and they will be placed into parent_map or missing_keys

1176

"""

1177

if not self.key_count():

1178

# We use key_count() to trigger reading the root node and

1179

# determining info about this BTreeGraphIndex

1180

# If we don't have any keys, then everything is missing

1181

missing_keys.update(keys)

1182

return set()

1183

if ref_list_num >= self.node_ref_lists:

1184

raise ValueError('No ref list %d, index has %d ref lists'

1185

% (ref_list_num, self.node_ref_lists))

1186

1187

# The main trick we are trying to accomplish is that when we find a

1188

# key listing its parents, we expect that the parent key is also likely

1189

# to sit on the same page. Allowing us to expand parents quickly

1190

# without suffering the full stack of bisecting, etc.

1191

nodes, nodes_and_keys = self._walk_through_internal_nodes(keys)

1192

1193

# These are parent keys which could not be immediately resolved on the

1194

# page where the child was present. Note that we may already be

1195

# searching for that key, and it may actually be present [or known

1196

# missing] on one of the other pages we are reading.

1197

# TODO:

1198

# We could try searching for them in the immediate previous or next

1199

# page. If they occur "later" we could put them in a pending lookup

1200

# set, and then for each node we read thereafter we could check to

1201

# see if they are present.

1202

# However, we don't know the impact of keeping this list of things

1203

# that I'm going to search for every node I come across from here on

1204

# out.

1205

# It doesn't handle the case when the parent key is missing on a

1206

# page that we *don't* read. So we already have to handle being

1207

# re-entrant for that.

1208

# Since most keys contain a date string, they are more likely to be

1209

# found earlier in the file than later, but we would know that right

1210

# away (key < min_key), and wouldn't keep searching it on every other

1211

# page that we read.

1212

# Mostly, it is an idea, one which should be benchmarked.

1213

parents_not_on_page = set()

1214

1215

for node_index, sub_keys in nodes_and_keys:

1216

if not sub_keys:

1217

continue

1218

# sub_keys is all of the keys we are looking for that should exist

1219

# on this page, if they aren't here, then they won't be found

1220

node = nodes[node_index]

1221

node_keys = node.keys

1222

parents_to_check = set()

1223

for next_sub_key in sub_keys:

1224

if next_sub_key not in node_keys:

1225

# This one is just not present in the index at all

1226

missing_keys.add(next_sub_key)

1227

else:

1228

value, refs = node_keys[next_sub_key]

1229

parent_keys = refs[ref_list_num]

1230

parent_map[next_sub_key] = parent_keys

1231

parents_to_check.update(parent_keys)

1232

# Don't look for things we've already found

1233

parents_to_check = parents_to_check.difference(parent_map)

1234

# this can be used to test the benefit of having the check loop

1235

# inlined.

1236

# parents_not_on_page.update(parents_to_check)

1237

# continue

1238

while parents_to_check:

1239

next_parents_to_check = set()

1240

for key in parents_to_check:

1241

if key in node_keys:

1242

value, refs = node_keys[key]

1243

parent_keys = refs[ref_list_num]

1244

parent_map[key] = parent_keys

1245

next_parents_to_check.update(parent_keys)

1246

else:

1247

# This parent either is genuinely missing, or should be

1248

# found on another page. Perf test whether it is better

1249

# to check if this node should fit on this page or not.

1250

# in the 'everything-in-one-pack' scenario, this *not*

1251

# doing the check is 237ms vs 243ms.

1252

# So slightly better, but I assume the standard 'lots

1253

# of packs' is going to show a reasonable improvement

1254

# from the check, because it avoids 'going around

1255

# again' for everything that is in another index

1256

# parents_not_on_page.add(key)

1257

# Missing for some reason

1258

if key < node.min_key:

1259

# in the case of bzr.dev, 3.4k/5.3k misses are

1260

# 'earlier' misses (65%)

1261

parents_not_on_page.add(key)

1262

elif key > node.max_key:

1263

# This parent key would be present on a different

1264

# LeafNode

1265

parents_not_on_page.add(key)

1266

else:

1267

# assert key != node.min_key and key != node.max_key

1268

# If it was going to be present, it would be on

1269

# *this* page, so mark it missing.

1270

missing_keys.add(key)

1271

parents_to_check = next_parents_to_check.difference(parent_map)

1272

# Might want to do another .difference() from missing_keys

1273

# parents_not_on_page could have been found on a different page, or be

1274

# known to be missing. So cull out everything that has already been

1275

# found.

1276

search_keys = parents_not_on_page.difference(

1277

parent_map).difference(missing_keys)

1278

return search_keys

1279

1280

def iter_entries_prefix(self, keys):

1281

"""Iterate over keys within the index using prefix matching.

1282

1283

Prefix matching is applied within the tuple of a key, not to within

1284

the bytestring of each key element. e.g. if you have the keys ('foo',

1285

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1286

only the former key is returned.

1287

1288

WARNING: Note that this method currently causes a full index parse

1289

unconditionally (which is reasonably appropriate as it is a means for

1290

thunking many small indices into one larger one and still supplies

1291

iter_all_entries at the thunk layer).

1292

1293

:param keys: An iterable providing the key prefixes to be retrieved.

1294

Each key prefix takes the form of a tuple the length of a key, but

1295

with the last N elements 'None' rather than a regular bytestring.

1296

The first element cannot be 'None'.

1297

:return: An iterable as per iter_all_entries, but restricted to the

1298

keys with a matching prefix to those supplied. No additional keys

1299

will be returned, and every match that is in the index will be

1300

returned.

1301

"""

1302

keys = sorted(set(keys))

1303

if not keys:

1304

return

1305

# Load if needed to check key lengths

1306

if self._key_count is None:

1307

self._get_root_node()

1308

# TODO: only access nodes that can satisfy the prefixes we are looking

1309

# for. For now, to meet API usage (as this function is not used by

1310

# current bzrlib) just suck the entire index and iterate in memory.

1311

nodes = {}

1312

if self.node_ref_lists:

1313

if self._key_length == 1:

1314

for _1, key, value, refs in self.iter_all_entries():

1315

nodes[key] = value, refs

1316

else:

1317

nodes_by_key = {}

1318

for _1, key, value, refs in self.iter_all_entries():

1319

key_value = key, value, refs

1320

# For a key of (foo, bar, baz) create

1321

# _nodes_by_key[foo][bar][baz] = key_value

1322

key_dict = nodes_by_key

1323

for subkey in key[:-1]:

1324

key_dict = key_dict.setdefault(subkey, {})

1325

key_dict[key[-1]] = key_value

1326

else:

1327

if self._key_length == 1:

1328

for _1, key, value in self.iter_all_entries():

1329

nodes[key] = value

1330

else:

1331

nodes_by_key = {}

1332

for _1, key, value in self.iter_all_entries():

1333

key_value = key, value

1334

# For a key of (foo, bar, baz) create

1335

# _nodes_by_key[foo][bar][baz] = key_value

1336

key_dict = nodes_by_key

1337

for subkey in key[:-1]:

1338

key_dict = key_dict.setdefault(subkey, {})

1339

key_dict[key[-1]] = key_value

1340

if self._key_length == 1:

1341

for key in keys:

1342

# sanity check

1343

if key[0] is None:

1344

raise errors.BadIndexKey(key)

1345

if len(key) != self._key_length:

1346

raise errors.BadIndexKey(key)

1347

try:

1348

if self.node_ref_lists:

1349

value, node_refs = nodes[key]

1350

yield self, key, value, node_refs

1351

else:

1352

yield self, key, nodes[key]

1353

except KeyError:

1354

pass

1355

return

1356

for key in keys:

1357

# sanity check

1358

if key[0] is None:

1359

raise errors.BadIndexKey(key)

1360

if len(key) != self._key_length:

1361

raise errors.BadIndexKey(key)

1362

# find what it refers to:

1363

key_dict = nodes_by_key

1364

elements = list(key)

1365

# find the subdict whose contents should be returned.

1366

try:

1367

while len(elements) and elements[0] is not None:

1368

key_dict = key_dict[elements[0]]

1369

elements.pop(0)

1370

except KeyError:

1371

# a non-existant lookup.

1372

continue

1373

if len(elements):

1374

dicts = [key_dict]

1375

while dicts:

1376

key_dict = dicts.pop(-1)

1377

# can't be empty or would not exist

1378

item, value = key_dict.iteritems().next()

1379

if type(value) == dict:

1380

# push keys

1381

dicts.extend(key_dict.itervalues())

1382

else:

1383

# yield keys

1384

for value in key_dict.itervalues():

1385

# each value is the key:value:node refs tuple

1386

# ready to yield.

1387

yield (self, ) + value

1388

else:

1389

# the last thing looked up was a terminal element

1390

yield (self, ) + key_dict

1391

1392

def key_count(self):

1393

"""Return an estimate of the number of keys in this index.

1394

1395

For BTreeGraphIndex the estimate is exact as it is contained in the

1396

header.

1397

"""

1398

if self._key_count is None:

1399

self._get_root_node()

1400

return self._key_count

1401

1402

def _compute_row_offsets(self):

1403

"""Fill out the _row_offsets attribute based on _row_lengths."""

1404

offsets = []

1405

row_offset = 0

1406

for row in self._row_lengths:

1407

offsets.append(row_offset)

1408

row_offset += row

1409

offsets.append(row_offset)

1410

self._row_offsets = offsets

1411

1412

def _parse_header_from_bytes(self, bytes):

1413

"""Parse the header from a region of bytes.

1414

1415

:param bytes: The data to parse.

1416

:return: An offset, data tuple such as readv yields, for the unparsed

1417

data. (which may be of length 0).

1418

"""

1419

signature = bytes[0:len(self._signature())]

1420

if not signature == self._signature():

1421

raise errors.BadIndexFormatSignature(self._name, BTreeGraphIndex)

1422

lines = bytes[len(self._signature()):].splitlines()

1423

options_line = lines[0]

1424

if not options_line.startswith(_OPTION_NODE_REFS):

1425

raise errors.BadIndexOptions(self)

1426

try:

1427

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):])

1428

except ValueError:

1429

raise errors.BadIndexOptions(self)

1430

options_line = lines[1]

1431

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

1432

raise errors.BadIndexOptions(self)

1433

try:

1434

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):])

1435

except ValueError:

1436

raise errors.BadIndexOptions(self)

1437

options_line = lines[2]

1438

if not options_line.startswith(_OPTION_LEN):

1439

raise errors.BadIndexOptions(self)

1440

try:

1441

self._key_count = int(options_line[len(_OPTION_LEN):])

1442

except ValueError:

1443

raise errors.BadIndexOptions(self)

1444

options_line = lines[3]

1445

if not options_line.startswith(_OPTION_ROW_LENGTHS):

1446

raise errors.BadIndexOptions(self)

1447

try:

1448

self._row_lengths = map(int, [length for length in

1449

options_line[len(_OPTION_ROW_LENGTHS):].split(',')

1450

if len(length)])

1451

except ValueError:

1452

raise errors.BadIndexOptions(self)

1453

self._compute_row_offsets()

1454

1455

# calculate the bytes we have processed

1456

header_end = (len(signature) + sum(map(len, lines[0:4])) + 4)

1457

return header_end, bytes[header_end:]

1458

1459

def _read_nodes(self, nodes):

1460

"""Read some nodes from disk into the LRU cache.

1461

1462

This performs a readv to get the node data into memory, and parses each

1463

node, then yields it to the caller. The nodes are requested in the

1464

supplied order. If possible doing sort() on the list before requesting

1465

a read may improve performance.

1466

1467

:param nodes: The nodes to read. 0 - first node, 1 - second node etc.

1468

:return: None

1469

"""

1470

# may be the byte string of the whole file

1471

bytes = None

1472

# list of (offset, length) regions of the file that should, evenually

1473

# be read in to data_ranges, either from 'bytes' or from the transport

1474

ranges = []

1475

for index in nodes:

1476

offset = index * _PAGE_SIZE

1477

size = _PAGE_SIZE

1478

if index == 0:

1479

# Root node - special case

1480

if self._size:

1481

size = min(_PAGE_SIZE, self._size)

1482

else:

1483

# The only case where we don't know the size, is for very

1484

# small indexes. So we read the whole thing

1485

bytes = self._transport.get_bytes(self._name)

1486

self._size = len(bytes)

1487

# the whole thing should be parsed out of 'bytes'

1488

ranges.append((0, len(bytes)))

1489

break

1490

else:

1491

if offset > self._size:

1492

raise AssertionError('tried to read past the end'

1493

' of the file %s > %s'

1494

% (offset, self._size))

1495

size = min(size, self._size - offset)

1496

ranges.append((offset, size))

1497

if not ranges:

1498

return

1499

elif bytes is not None:

1500

# already have the whole file

1501

data_ranges = [(start, bytes[start:start+_PAGE_SIZE])

1502

for start in xrange(0, len(bytes), _PAGE_SIZE)]

1503

elif self._file is None:

1504

data_ranges = self._transport.readv(self._name, ranges)

1505

else:

1506

data_ranges = []

1507

for offset, size in ranges:

1508

self._file.seek(offset)

1509

data_ranges.append((offset, self._file.read(size)))

1510

for offset, data in data_ranges:

1511

if offset == 0:

1512

# extract the header

1513

offset, data = self._parse_header_from_bytes(data)

1514

if len(data) == 0:

1515

continue

1516

bytes = zlib.decompress(data)

1517

if bytes.startswith(_LEAF_FLAG):

1518

node = _LeafNode(bytes, self._key_length, self.node_ref_lists)

1519

elif bytes.startswith(_INTERNAL_FLAG):

1520

node = _InternalNode(bytes)

1521

else:

1522

raise AssertionError("Unknown node type for %r" % bytes)

1523

yield offset / _PAGE_SIZE, node

1524

1525

def _signature(self):

1526

"""The file signature for this index type."""

1527

return _BTSIGNATURE

1528

1529

def validate(self):

1530

"""Validate that everything in the index can be accessed."""

1531

# just read and parse every node.

1532

self._get_root_node()

1533

if len(self._row_lengths) > 1:

1534

start_node = self._row_offsets[1]

1535

else:

1536

# We shouldn't be reading anything anyway

1537

start_node = 1

1538

node_end = self._row_offsets[-1]

1539

for node in self._read_nodes(range(start_node, node_end)):

1540

pass

1541

1542

1543

try:

1544

from bzrlib import _btree_serializer_pyx as _btree_serializer

1545

except ImportError, e:

1546

osutils.failed_to_load_extension(e)

1547

from bzrlib import _btree_serializer_py as _btree_serializer

Older »