/brz/remove-bazaar : revision 4744.2.7

To get this branch, use:

bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/btree_index.py

Committer: John Arbash Meinel
Date: 2009-10-19 15:45:10 UTC
mto: This revision was merged to the branch mainline in revision 4758.
Revision ID: john@arbash-meinel.com-20091019154510-tr02ifha84pmo3zh

Add .clear_cache() members to GraphIndexBuilder and BTreeBuilder.

Update GroupCompressVersionedFiles.clear_cache() to clear the graph index's caches.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_import_c_api.h

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/doc_generate/sphinx_conf.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/static_tuple.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_uifactory

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/script.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_script.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/pathfilter.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/Bazaar-Logo-For-Manuals.png

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/conf.py

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/implementation-notes.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index-plain.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/miscellaneous-notes.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/process.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/specifications.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_static/en/Makefile

doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/_static/en/bzr-en-quick-reference.png

doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/Makefile

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/index.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/index.txt

doc/es/user-guide

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/news-template.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/convertfile.py

tools/convertinv.py

tools/generate_docs.py

tools/generate_release_notes.py

tools/history2revfiles.py

tools/http_client.py

tools/package_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-control.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/btree_index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""B+Tree indices"""

import cStringIO

from bisect import bisect_right

import math

import tempfile

import zlib

from bzrlib import (

chunk_writer,

debug,

errors,

fifo_cache,

index,

lru_cache,

osutils,

trace,

)

from bzrlib.index import _OPTION_NODE_REFS, _OPTION_KEY_ELEMENTS, _OPTION_LEN

from bzrlib.transport import get_transport

_BTSIGNATURE = "B+Tree Graph Index 2\n"

_OPTION_ROW_LENGTHS = "row_lengths="

_LEAF_FLAG = "type=leaf\n"

_INTERNAL_FLAG = "type=internal\n"

_INTERNAL_OFFSET = "offset="

_RESERVED_HEADER_BYTES = 120

_PAGE_SIZE = 4096

# 4K per page: 4MB - 1000 entries

_NODE_CACHE_SIZE = 1000

class _BuilderRow(object):

"""The stored state accumulated while writing out a row in the index.

:ivar spool: A temporary file used to accumulate nodes for this row

in the tree.

:ivar nodes: The count of nodes emitted so far.

"""

def __init__(self):

"""Create a _BuilderRow."""

self.nodes = 0

self.spool = None# tempfile.TemporaryFile(prefix='bzr-index-row-')

self.writer = None

def finish_node(self, pad=True):

byte_lines, _, padding = self.writer.finish()

if self.nodes == 0:

self.spool = cStringIO.StringIO()

# padded note:

self.spool.write("\x00" * _RESERVED_HEADER_BYTES)

elif self.nodes == 1:

# We got bigger than 1 node, switch to a temp file

spool = tempfile.TemporaryFile(prefix='bzr-index-row-')

spool.write(self.spool.getvalue())

self.spool = spool

skipped_bytes = 0

if not pad and padding:

del byte_lines[-1]

skipped_bytes = padding

self.spool.writelines(byte_lines)

remainder = (self.spool.tell() + skipped_bytes) % _PAGE_SIZE

if remainder != 0:

raise AssertionError("incorrect node length: %d, %d"

% (self.spool.tell(), remainder))

self.nodes += 1

self.writer = None

class _InternalBuilderRow(_BuilderRow):
    """Row state used while writing out an internal (non-leaf) row."""

    def finish_node(self, pad=True):
        """Finish the current internal node; internal nodes must be padded.

        :param pad: Must be true.
        :raises AssertionError: If pad is false.
        """
        if pad:
            _BuilderRow.finish_node(self)
            return
        raise AssertionError("Must pad internal nodes only.")

100

class _LeafBuilderRow(_BuilderRow):
    """Row state used while writing out the leaf row of the tree."""

102

103

104

class BTreeBuilder(index.GraphIndexBuilder):

105

"""A Builder for B+Tree based Graph indices.

106

107

The resulting graph has the structure:

108

109

_SIGNATURE OPTIONS NODES

110

_SIGNATURE := 'B+Tree Graph Index 2' NEWLINE

111

OPTIONS := REF_LISTS KEY_ELEMENTS LENGTH ROW_LENGTHS

112

REF_LISTS := 'node_ref_lists=' DIGITS NEWLINE

113

KEY_ELEMENTS := 'key_elements=' DIGITS NEWLINE

114

LENGTH := 'len=' DIGITS NEWLINE

115

ROW_LENGTHS := 'row_lengths=' DIGITS (COMMA DIGITS)* NEWLINE

116

NODES := NODE_COMPRESSED*

117

NODE_COMPRESSED:= COMPRESSED_BYTES{4096}

118

NODE_RAW := INTERNAL | LEAF

119

INTERNAL := INTERNAL_FLAG POINTERS

120

LEAF := LEAF_FLAG ROWS

121

KEY_ELEMENT := Not-whitespace-utf8

122

KEY := KEY_ELEMENT (NULL KEY_ELEMENT)*

123

ROWS := ROW*

124

ROW := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

125

ABSENT := 'a'

126

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

127

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

128

REFERENCE := KEY

129

VALUE := no-newline-no-null-bytes

130

"""

131

132

def __init__(self, reference_lists=0, key_elements=1, spill_at=100000):
    """See GraphIndexBuilder.__init__.

    :param reference_lists: Passed through to GraphIndexBuilder.__init__.
    :param key_elements: Passed through to GraphIndexBuilder.__init__.
    :param spill_at: Optional parameter controlling the maximum number
        of nodes that BTreeBuilder will hold in memory.
    """
    index.GraphIndexBuilder.__init__(
        self, reference_lists=reference_lists, key_elements=key_elements)
    self._spill_at = spill_at
    # Indices already spilled to disk; slots may later be set to None.
    self._backing_indices = []
    # A map of {key: (node_refs, value)}
    self._nodes = {}
    # Built lazily by _get_nodes_by_key(); None means "not built yet".
    self._nodes_by_key = None
    self._optimize_for_size = False

147

148

def add_node(self, key, value, references=()):
    """Add a node to the index.

    If adding the node causes the builder to reach its spill_at threshold,
    disk spilling will be triggered.

    :param key: The key. Keys are non-empty tuples containing as many
        whitespace-free utf8 bytestrings as the key length defined for
        this index.
    :param value: The value to associate with the key. It may be any
        bytes as long as it does not contain NUL or newline.
    :param references: An iterable of iterables of keys. Each is a
        reference to another key.
    :raises errors.BadIndexDuplicateKey: If key is already held in memory.
    """
    # The second item returned (the absent references) is not needed here.
    checked_refs, _ = self._check_key_ref_value(key, references, value)
    if key in self._nodes:
        raise errors.BadIndexDuplicateKey(key, self)
    # TODO: StaticTuple
    self._nodes[key] = (checked_refs, value)
    self._keys.add(key)
    by_key_is_built = self._nodes_by_key is not None
    if by_key_is_built and self._key_length > 1:
        # Keep the already-built prefix lookup structure up to date.
        self._update_nodes_by_key(key, value, checked_refs)
    if len(self._keys) >= self._spill_at:
        self._spill_mem_keys_to_disk()

174

175

def _spill_mem_keys_to_disk(self):
    """Write the in memory keys down to disk to cap memory consumption.

    If we already have some keys written to disk, we will combine them so
    as to preserve the sorted order. The algorithm for combining uses
    powers of two. So on the first spill, write all mem nodes into a
    single index. On the second spill, combine the mem nodes with the nodes
    on disk to create a 2x sized disk index and get rid of the first index.
    On the third spill, create a single new disk index, which will contain
    the mem nodes, and preserve the existing 2x sized index. On the fourth,
    combine mem with the first and second indexes, creating a new one of
    size 4x. On the fifth create a single new one, etc.

    When self._combine_backing_indices is false the in-memory nodes are
    simply written out as one more backing index. Either way the in-memory
    state (_keys, _nodes, _nodes_by_key) is reset afterwards.
    """
    if self._combine_backing_indices:
        spilled_file, size, slot = self._spill_mem_keys_and_combine()
    else:
        spilled_file, size = self._spill_mem_keys_without_combining()
    # Note: The transport here isn't strictly needed, because we will use
    #       direct access to the spilled_index._file object
    spilled_index = BTreeGraphIndex(get_transport('.'), '<temp>', size)
    # GC will clean up the file
    spilled_index._file = spilled_file
    if self._combine_backing_indices:
        if len(self._backing_indices) == slot:
            self._backing_indices.append(None)
        self._backing_indices[slot] = spilled_index
        # Everything before the slot was merged into the new index.
        for merged in range(slot):
            self._backing_indices[merged] = None
    else:
        self._backing_indices.append(spilled_index)
    self._keys = set()
    self._nodes = {}
    self._nodes_by_key = None

209

210

def _spill_mem_keys_without_combining(self):

211

return self._write_nodes(self._iter_mem_nodes(), allow_optimize=False)

212

213

def _spill_mem_keys_and_combine(self):

214

iterators_to_combine = [self._iter_mem_nodes()]

215

pos = -1

216

for pos, backing in enumerate(self._backing_indices):

217

if backing is None:

218

pos -= 1

219

break

220

iterators_to_combine.append(backing.iter_all_entries())

221

backing_pos = pos + 1

222

new_backing_file, size = \

223

self._write_nodes(self._iter_smallest(iterators_to_combine),

224

allow_optimize=False)

225

return new_backing_file, size, backing_pos

226

227

def add_nodes(self, nodes):
    """Add nodes to the index.

    :param nodes: An iterable of entries to add. Each entry is
        (key, value, node_refs) when this index has reference lists and
        (key, value) otherwise.
    """
    if not self.reference_lists:
        for (key, value) in nodes:
            self.add_node(key, value)
        return
    for (key, value, node_refs) in nodes:
        self.add_node(key, value, node_refs)

238

239

def _iter_mem_nodes(self):

240

"""Iterate over the nodes held in memory."""

241

nodes = self._nodes

242

if self.reference_lists:

243

for key in sorted(nodes):

244

references, value = nodes[key]

245

yield self, key, value, references

246

else:

247

for key in sorted(nodes):

248

references, value = nodes[key]

249

yield self, key, value

250

251

def _iter_smallest(self, iterators_to_combine):

252

if len(iterators_to_combine) == 1:

253

for value in iterators_to_combine[0]:

254

yield value

255

return

256

current_values = []

257

for iterator in iterators_to_combine:

258

try:

259

current_values.append(iterator.next())

260

except StopIteration:

261

current_values.append(None)

262

last = None

263

while True:

264

# Decorate candidates with the value to allow 2.4's min to be used.

265

candidates = [(item[1][1], item) for item

266

in enumerate(current_values) if item[1] is not None]

267

if not len(candidates):

268

return

269

selected = min(candidates)

270

# undecorate back to (pos, node)

271

selected = selected[1]

272

if last == selected[1][1]:

273

raise errors.BadIndexDuplicateKey(last, self)

274

last = selected[1][1]

275

# Yield, with self as the index

276

yield (self,) + selected[1][1:]

277

pos = selected[0]

278

try:

279

current_values[pos] = iterators_to_combine[pos].next()

280

except StopIteration:

281

current_values[pos] = None

282

283

def _add_key(self, string_key, line, rows, allow_optimize=True):
    """Add a key to the current chunk.

    If the line does not fit in the open leaf node, that node is finished,
    the key is recorded as a division point in the rows above (finishing
    any of those that are full too, and inserting a new root row when even
    the top row is full), and the add is retried on a fresh leaf node.

    :param string_key: The key to add.
    :param line: The fully serialised key and value.
    :param rows: The list of builder rows, root first and leaf row last.
        It is modified in place when a new root row is needed.
    :param allow_optimize: If set to False, prevent setting the optimize
        flag when writing out. This is used by the _spill_mem_keys_to_disk
        functionality.
    """
    leaf_row = rows[-1]
    if leaf_row.writer is None:
        # Opening a new leaf chunk: first flesh out any internal nodes
        # that are needed to preserve the height of the tree.
        for depth, parent in enumerate(rows[:-1]):
            if parent.writer is not None:
                continue
            capacity = _PAGE_SIZE
            if parent.nodes == 0:
                capacity -= _RESERVED_HEADER_BYTES # padded
            if allow_optimize:
                optimize_for_size = self._optimize_for_size
            else:
                optimize_for_size = False
            parent.writer = chunk_writer.ChunkWriter(
                capacity, 0, optimize_for_size=optimize_for_size)
            parent.writer.write(_INTERNAL_FLAG)
            parent.writer.write(
                _INTERNAL_OFFSET + str(rows[depth + 1].nodes) + "\n")
        # add a new leaf
        capacity = _PAGE_SIZE
        if leaf_row.nodes == 0:
            capacity -= _RESERVED_HEADER_BYTES # padded
        # NOTE(review): allow_optimize is not consulted for the leaf
        # writer (nor for a new root row below) -- confirm this is intended.
        leaf_row.writer = chunk_writer.ChunkWriter(
            capacity, optimize_for_size=self._optimize_for_size)
        leaf_row.writer.write(_LEAF_FLAG)
    if not leaf_row.writer.write(line):
        # The key fitted; nothing more to do.
        return
    # This key did not fit in the node:
    leaf_row.finish_node()
    key_line = string_key + "\n"
    needs_new_root = True
    for row in reversed(rows[:-1]):
        # Mark the start of the next node in the node above. If it
        # doesn't fit then propagate upwards until we find one that
        # it does fit into.
        if row.writer.write(key_line):
            row.finish_node()
        else:
            # We've found a node that can handle the pointer.
            needs_new_root = False
            break
    # If we reached the current root without being able to mark the
    # division point, then we need a new root:
    if needs_new_root:
        if 'index' in debug.debug_flags:
            trace.mutter('Inserting new global row.')
        root_row = _InternalBuilderRow()
        rows.insert(0, root_row)
        # The first node of a row is padded, hence the reduced capacity.
        root_row.writer = chunk_writer.ChunkWriter(
            _PAGE_SIZE - _RESERVED_HEADER_BYTES,
            0,
            optimize_for_size=self._optimize_for_size)
        root_row.writer.write(_INTERNAL_FLAG)
        root_row.writer.write(
            _INTERNAL_OFFSET + str(rows[1].nodes - 1) + "\n")
        root_row.writer.write(key_line)
    # Retry: the leaf row now has no writer, so a new leaf gets opened.
    self._add_key(string_key, line, rows, allow_optimize=allow_optimize)

351

352

def _write_nodes(self, node_iterator, allow_optimize=True):
    """Write node_iterator out as a B+Tree.

    :param node_iterator: An iterator of sorted nodes. Each node should
        match the output given by iter_all_entries.
    :param allow_optimize: If set to False, prevent setting the optimize
        flag when writing out. This is used by the _spill_mem_keys_to_disk
        functionality.
    :return: (file, size): a file-like object positioned at 0 containing a
        B+Tree for the nodes, and the number of bytes written to it. The
        file is a named temporary file when there is more than one leaf
        node, and an in-memory buffer otherwise.
    :raises AssertionError: If the header does not fit in the reserved
        space, or an internal row did not copy the expected byte count.
    """
    # The index rows - rows[0] is the root, rows[1] is the layer under it
    # etc.
    rows = []
    # forward sorted by key. In future we may consider topological sorting,
    # at the cost of table scans for direct lookup, or a second index for
    # direct lookup
    total_keys = 0
    # A stack with the number of nodes of each size. 0 is the root node
    # and must always be 1 (if there are any nodes in the tree).
    self.row_lengths = []
    # Loop over all nodes adding them to the bottom row (rows[-1]). When
    # we finish a chunk in a row, propagate the key that didn't fit (comes
    # after the chunk) to the row above, transitively.
    for node in node_iterator:
        if total_keys == 0:
            # First key triggers the first row
            rows.append(_LeafBuilderRow())
        total_keys += 1
        string_key, line = _btree_serializer._flatten_node(
            node, self.reference_lists)
        self._add_key(string_key, line, rows, allow_optimize=allow_optimize)
    # Close the nodes still open, leaves first; only non-leaf rows pad.
    for row in reversed(rows):
        is_leaf_row = type(row) == _LeafBuilderRow
        row.finish_node(pad=not is_leaf_row)
    node_counts = [row.nodes for row in rows]
    header = [
        _BTSIGNATURE,
        _OPTION_NODE_REFS + str(self.reference_lists) + '\n',
        _OPTION_KEY_ELEMENTS + str(self._key_length) + '\n',
        _OPTION_LEN + str(total_keys) + '\n',
        _OPTION_ROW_LENGTHS
            + ','.join([str(count) for count in node_counts]) + '\n',
        ]
    if node_counts and node_counts[-1] > 1:
        result = tempfile.NamedTemporaryFile(prefix='bzr-index-')
    else:
        result = cStringIO.StringIO()
    result.writelines(header)
    position = sum([len(text) for text in header])
    if position > _RESERVED_HEADER_BYTES:
        raise AssertionError("Could not fit the header in the"
                             " reserved space: %d > %d"
                             % (position, _RESERVED_HEADER_BYTES))
    # write the rows out:
    for row in rows:
        reserved = _RESERVED_HEADER_BYTES # reserved space for first node
        spool = row.spool
        spool.flush()
        spool.seek(0)
        # copy nodes to the finalised file.
        # Special case the first node as it may be prefixed: its reserved
        # leading bytes are skipped and zero bytes are written after it
        # instead (fewer by the header length for the very first row).
        first_node = spool.read(_PAGE_SIZE)
        result.write(first_node[reserved:])
        result.write("\x00" * (reserved - position))
        position = 0 # Only the root row actually has an offset
        copied_len = osutils.pumpfile(spool, result)
        expected_len = (row.nodes - 1) * _PAGE_SIZE
        if copied_len != expected_len and type(row) != _LeafBuilderRow:
            raise AssertionError("Incorrect amount of data copied"
                                 " expected: %d, got: %d"
                                 % (expected_len, copied_len))
    result.flush()
    size = result.tell()
    result.seek(0)
    return result, size

427

428

def finish(self):
    """Finalise the index.

    :return: A file handle for a temporary file containing the nodes added
        to the index.
    """
    written = self._write_nodes(self.iter_all_entries())
    # _write_nodes also reports a size; only the file is returned.
    return written[0]

435

436

def iter_all_entries(self):
    """Iterate over all keys within the index.

    :return: An iterable of (index, key, value, reference_lists). The
        in-memory nodes are produced in sorted key order and merged
        smallest-key-first with the entries of every live backing index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    # Doing serial rather than ordered would be faster; but this shouldn't
    # be getting called routinely anyway.
    sources = [self._iter_mem_nodes()]
    sources.extend([backing.iter_all_entries()
                    for backing in self._backing_indices
                    if backing is not None])
    if len(sources) > 1:
        return self._iter_smallest(sources)
    return sources[0]

455

456

def iter_entries(self, keys):
    """Iterate over keys within the index.

    Keys held in memory are yielded first; the remaining keys are then
    looked up in each live backing index in turn.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable of (index, key, value, reference_lists). There is
        no defined order for the result iteration - it will be in the most
        efficient order for the index (keys iteration order in this case).
    """
    wanted = set(keys)
    in_memory = wanted.intersection(self._keys)
    with_references = self.reference_lists
    for key in in_memory:
        # Stored as (node_refs, value).
        stored = self._nodes[key]
        if with_references:
            yield self, key, stored[1], stored[0]
        else:
            yield self, key, stored[1]
    # Find things that are in backing indices that have not been handled
    # yet.
    if not self._backing_indices:
        return # We won't find anything there either
    # Remove all of the keys that we found locally
    wanted.difference_update(in_memory)
    for backing in self._backing_indices:
        if backing is None:
            continue
        if not wanted:
            return
        for found in backing.iter_entries(wanted):
            wanted.remove(found[1])
            yield (self,) + found[1:]

488

489

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not to within
    the bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned.
    :raises errors.BadIndexKey: If a prefix starts with None or does not
        have the key length of this index.
    """
    # XXX: Too much duplication with the GraphIndex class; consider finding
    # a good place to pull out the actual common logic.
    prefixes = set(keys)
    if not prefixes:
        return
    # Entries from the backing indices come first, re-labelled with self.
    for backing in self._backing_indices:
        if backing is None:
            continue
        for found in backing.iter_entries_prefix(prefixes):
            yield (self,) + found[1:]
    if self._key_length == 1:
        # Single-element keys: a prefix is simply a complete key.
        for prefix in prefixes:
            # sanity check
            if prefix[0] is None or len(prefix) != self._key_length:
                raise errors.BadIndexKey(prefix)
            try:
                stored = self._nodes[prefix]
            except KeyError:
                continue
            if self.reference_lists:
                yield self, prefix, stored[1], stored[0]
            else:
                yield self, prefix, stored[1]
        return
    for prefix in prefixes:
        # sanity check
        if prefix[0] is None or len(prefix) != self._key_length:
            raise errors.BadIndexKey(prefix)
        # find what it refers to:
        subtree = self._get_nodes_by_key()
        remaining = list(prefix)
        # Descend one level per leading non-None element.
        try:
            while len(remaining) and remaining[0] is not None:
                subtree = subtree[remaining[0]]
                remaining.pop(0)
        except KeyError:
            # a non-existent lookup.
            continue
        if not len(remaining):
            # The whole key was given, so subtree is the entry itself.
            yield (self, ) + subtree
            continue
        # Trailing None elements: yield every entry below this point.
        pending = [subtree]
        while pending:
            subtree = pending.pop(-1)
            # can't be empty or would not exist
            _, sample = subtree.iteritems().next()
            if type(sample) == dict:
                # push keys
                pending.extend(subtree.itervalues())
            else:
                # yield keys
                for entry in subtree.itervalues():
                    yield (self, ) + entry

564

565

def _get_nodes_by_key(self):

566

if self._nodes_by_key is None:

567

nodes_by_key = {}

568

if self.reference_lists:

569

for key, (references, value) in self._nodes.iteritems():

570

key_dict = nodes_by_key

571

for subkey in key[:-1]:

572

key_dict = key_dict.setdefault(subkey, {})

573

key_dict[key[-1]] = key, value, references

574

else:

575

for key, (references, value) in self._nodes.iteritems():

576

key_dict = nodes_by_key

577

for subkey in key[:-1]:

578

key_dict = key_dict.setdefault(subkey, {})

579

key_dict[key[-1]] = key, value

580

self._nodes_by_key = nodes_by_key

581

return self._nodes_by_key

582

583

def key_count(self):
    """Return an estimate of the number of keys in this index.

    This is the number of keys held in memory plus whatever key_count()
    reports for each live backing index.
    """
    total = len(self._keys)
    for backing in self._backing_indices:
        if backing is not None:
            total += backing.key_count()
    return total

590

591

def validate(self):
    """Do nothing: in memory indices have no known corruption to check."""
    return None

593

594

595

class _LeafNode(object):
    """A leaf node for a serialised B+Tree index.

    :ivar keys: A dict built from the parsed (key, ...) pairs of the node.
    :ivar min_key: The key of the first parsed entry, or None if the node
        is empty.
    :ivar max_key: The key of the last parsed entry, or None if the node
        is empty.
    """

    __slots__ = ('keys', 'min_key', 'max_key')

    def __init__(self, bytes, key_length, ref_list_length):
        """Parse bytes to create a leaf node object.

        :param bytes: The serialised content of the leaf node.
        :param key_length: Passed on to the leaf line parser.
        :param ref_list_length: Passed on to the leaf line parser.
        """
        # splitlines mangles the \r delimiters.. don't use it.
        entries = _btree_serializer._parse_leaf_lines(
            bytes, key_length, ref_list_length)
        # First/last entry give min/max; presumably the parser returns
        # entries in key order -- confirm against _parse_leaf_lines.
        if not entries:
            self.min_key = self.max_key = None
        else:
            self.min_key = entries[0][0]
            self.max_key = entries[-1][0]
        self.keys = dict(entries)

611

612

613

class _InternalNode(object):

614

"""An internal node for a serialised B+Tree index."""

615

616

__slots__ = ('keys', 'offset')

617

618

def __init__(self, bytes):

619

"""Parse bytes to create an internal node object."""

620

# splitlines mangles the \r delimiters.. don't use it.

621

self.keys = self._parse_lines(bytes.split('\n'))

622

623

def _parse_lines(self, lines):

624

nodes = []

625

self.offset = int(lines[1][7:])

626

for line in lines[2:]:

627

if line == '':

628

break

629

# TODO: Switch to StaticTuple here.

630

nodes.append(tuple(map(intern, line.split('\0'))))

631

return nodes

632

633

634

class BTreeGraphIndex(object):

635

"""Access to nodes via the standard GraphIndex interface for B+Tree's.

636

637

Individual nodes are held in a LRU cache. This holds the root node in

638

memory except when very large walks are done.

639

"""

640

641

def __init__(self, transport, name, size, unlimited_cache=False):
    """Create a B+Tree index object on the index name.

    :param transport: The transport to read data for the index from.
    :param name: The file name of the index on transport.
    :param size: Optional size of the index in bytes. This allows
        compatibility with the GraphIndex API, as well as ensuring that
        the initial read (to read the root node header) can be done
        without over-reading even on empty indices, and on small indices
        allows single-IO to read the entire index.
    :param unlimited_cache: If set to True, then instead of using an
        LRUCache with size _NODE_CACHE_SIZE, we will use a dict and always
        cache all leaf nodes.
    """
    self._transport = transport
    self._name = name
    self._size = size
    self._file = None
    # Needs self._transport, so it must come after the assignment above.
    self._recommended_pages = self._compute_recommended_pages()
    # Nothing has been read yet.
    self._root_node = None
    self._key_count = None
    self._row_lengths = None
    self._row_offsets = None # Start of each row, [-1] is the end
    # Leaf value caching is currently switched off.
    self._leaf_value_cache = None
    if unlimited_cache:
        self._internal_node_cache = {}
        self._leaf_node_cache = {}
    else:
        # We use a FIFO here just to prevent possible blowout. However, a
        # 300k record btree has only 3k leaf nodes, and only 20 internal
        # nodes. A value of 100 scales to ~100*100*100 = 1M records.
        self._leaf_node_cache = lru_cache.LRUCache(_NODE_CACHE_SIZE)
        self._internal_node_cache = fifo_cache.FIFOCache(100)

675

676

def __eq__(self, other):

677

"""Equal when self and other were created with the same parameters."""

678

return (

679

type(self) == type(other) and

680

self._transport == other._transport and

681

self._name == other._name and

682

self._size == other._size)

683

684

def __ne__(self, other):

685

return not self.__eq__(other)

686

687

def _get_and_cache_nodes(self, nodes):

688

"""Read nodes and cache them in the lru.

689

690

The nodes list supplied is sorted and then read from disk, each node

691

being inserted it into the _node_cache.

692

693

Note: Asking for more nodes than the _node_cache can contain will

694

result in some of the results being immediately discarded, to prevent

695

this an assertion is raised if more nodes are asked for than are

696

cachable.

697

698

:return: A dict of {node_pos: node}

699

"""

700

found = {}

701

start_of_leaves = None

702

for node_pos, node in self._read_nodes(sorted(nodes)):

703

if node_pos == 0: # Special case

704

self._root_node = node

705

else:

706

if start_of_leaves is None:

707

start_of_leaves = self._row_offsets[-2]

708

if node_pos < start_of_leaves:

709

self._internal_node_cache[node_pos] = node

710

else:

711

self._leaf_node_cache[node_pos] = node

712

found[node_pos] = node

713

return found

714

715

def _compute_recommended_pages(self):
    """Express the transport's recommended read size in btree pages.

    recommended_page_size() is in bytes; the result is the number of
    _PAGE_SIZE pages needed to cover that many bytes, rounded up.
    """
    read_bytes = self._transport.recommended_page_size()
    pages = math.ceil(read_bytes / float(_PAGE_SIZE))
    return int(pages)

725

726

def _compute_total_pages_in_index(self):

727

"""How many pages are in the index.

728

729

If we have read the header we will use the value stored there.

730

Otherwise it will be computed based on the length of the index.

731

"""

732

if self._size is None:

733

raise AssertionError('_compute_total_pages_in_index should not be'

734

' called when self._size is None')

735

if self._root_node is not None:

736

# This is the number of pages as defined by the header

737

return self._row_offsets[-1]

738

# This is the number of pages as defined by the size of the index. They

739

# should be indentical.

740

total_pages = int(math.ceil(self._size / float(_PAGE_SIZE)))

741

return total_pages

742

743

def _expand_offsets(self, offsets):
    """Decide which extra pages to download along with ``offsets``.

    The idea is that we always want to make big-enough requests (like 64kB
    for http) so that round trips are not wasted.  Given the pages already
    cached and the pages about to be read, work out which other pages are
    worth reading in the same request.

    See also doc/developers/btree_index_prefetch.txt for more details.

    :param offsets: The offsets to be read
    :return: A list of offsets to download
    """
    verbose = 'index' in debug.debug_flags
    if verbose:
        trace.mutter('expanding: %s\toffsets: %s', self._name, offsets)

    recommended = self._recommended_pages
    if len(offsets) >= recommended:
        # Already requesting more than enough; don't add more.
        if verbose:
            trace.mutter(' not expanding large request (%s >= %s)',
                         len(offsets), recommended)
        return offsets

    if self._size is None:
        # Without the size we don't know where the file ends.
        if verbose:
            trace.mutter(' not expanding without knowing index size')
        return offsets

    total_pages = self._compute_total_pages_in_index()
    cached_offsets = self._get_offsets_to_cached_pages()

    if total_pages - len(cached_offsets) <= recommended:
        # Reading recommended_pages would read the rest of the index, so
        # just read whatever is left.
        if cached_offsets:
            expanded = [x for x in xrange(total_pages)
                        if x not in cached_offsets]
        else:
            expanded = range(total_pages)
        if verbose:
            trace.mutter(' reading all unread pages: %s', expanded)
        return expanded

    if self._root_node is None:
        # ATM on the first read of the root node of a large index, we
        # don't bother pre-reading any other pages, because the likelihood
        # of actually reading interesting pages is very low.
        # See doc/developers/btree_index_prefetch.txt for a discussion,
        # and a possible implementation for when we are guessing that the
        # second layer index is small.
        final_offsets = offsets
    else:
        tree_depth = len(self._row_lengths)
        if len(offsets) == 1 and len(cached_offsets) < tree_depth:
            # We haven't read enough to justify expansion. If we are only
            # going to read the root node and 1 leaf node it isn't worth
            # expanding the request. Once at least 2 nodes have been read
            # we are probably doing a search, and start expanding.
            if verbose:
                trace.mutter(' not expanding on first reads')
            return offsets
        final_offsets = self._expand_to_neighbors(offsets, cached_offsets,
                                                  total_pages)

    final_offsets = sorted(final_offsets)
    if verbose:
        trace.mutter('expanded: %s', final_offsets)
    return final_offsets

811

812

def _expand_to_neighbors(self, offsets, cached_offsets, total_pages):

813

"""Expand requests to neighbors until we have enough pages.

814

815

This is called from _expand_offsets after policy has determined that we

816

want to expand.

817

We only want to expand requests within a given layer. We cheat a little

818

bit and assume all requests will be in the same layer. This is true

819

given the current design, but if it changes this algorithm may perform

820

oddly.

821

822

:param offsets: requested offsets

823

:param cached_offsets: offsets for pages we currently have cached

824

:return: A set() of offsets after expansion

825

"""

826

final_offsets = set(offsets)

827

first = end = None

828

new_tips = set(final_offsets)

829

while len(final_offsets) < self._recommended_pages and new_tips:

830

next_tips = set()

831

for pos in new_tips:

832

if first is None:

833

first, end = self._find_layer_first_and_end(pos)

834

previous = pos - 1

835

if (previous > 0

836

and previous not in cached_offsets

837

and previous not in final_offsets

838

and previous >= first):

839

next_tips.add(previous)

840

after = pos + 1

841

if (after < total_pages

842

and after not in cached_offsets

843

and after not in final_offsets

844

and after < end):

845

next_tips.add(after)

846

# This would keep us from going bigger than

847

# recommended_pages by only expanding the first offsets.

848

# However, if we are making a 'wide' request, it is

849

# reasonable to expand all points equally.

850

# if len(final_offsets) > recommended_pages:

851

# break

852

final_offsets.update(next_tips)

853

new_tips = next_tips

854

return final_offsets

855

856

def clear_cache(self):
    """Drop the cached leaf nodes.

    This can be called at any time, but generally it is used when some
    information has been extracted and no further requests to this index
    are expected.
    """
    # self._root_node and self._internal_node_cache are deliberately left
    # alone: neither is expected to be big, and keeping them can save
    # round-trips later. This may be re-evaluated if InternalNode memory
    # starts to be an issue.
    leaf_cache = self._leaf_node_cache
    leaf_cache.clear()

868

869

def external_references(self, ref_list_num):
    """Return the keys referenced by this index but not present in it.

    Every entry from iter_all_entries() is visited; the references found
    in reference list ``ref_list_num`` are collected and the keys that are
    themselves entries of the index are subtracted.

    :param ref_list_num: Which of the entries' reference lists to inspect.
    :return: A set of referenced keys that are not keys of this index.
    :raises ValueError: if the index has no reference list with that
        number.
    """
    if self._root_node is None:
        self._get_root_node()
    available = self.node_ref_lists
    if ref_list_num + 1 > available:
        raise ValueError('No ref list %d, index has %d ref lists'
                         % (ref_list_num, available))
    present = set()
    referenced = set()
    for entry in self.iter_all_entries():
        present.add(entry[1])
        referenced.update(entry[3][ref_list_num])
    return referenced - present

881

882

def _find_layer_first_and_end(self, offset):

883

"""Find the start/stop nodes for the layer corresponding to offset.

884

885

:return: (first, end)

886

first is the first node in this layer

887

end is the first node of the next layer

888

"""

889

first = end = 0

890

for roffset in self._row_offsets:

891

first = end

892

end = roffset

893

if offset < roffset:

894

break

895

return first, end

896

897

def _get_offsets_to_cached_pages(self):

898

"""Determine what nodes we already have cached."""

899

cached_offsets = set(self._internal_node_cache.keys())

900

cached_offsets.update(self._leaf_node_cache.keys())

901

if self._root_node is not None:

902

cached_offsets.add(0)

903

return cached_offsets

904

905

def _get_root_node(self):

906

if self._root_node is None:

907

# We may not have a root node yet

908

self._get_internal_nodes([0])

909

return self._root_node

910

911

def _get_nodes(self, cache, node_indexes):

912

found = {}

913

needed = []

914

for idx in node_indexes:

915

if idx == 0 and self._root_node is not None:

916

found[0] = self._root_node

917

continue

918

try:

919

found[idx] = cache[idx]

920

except KeyError:

921

needed.append(idx)

922

if not needed:

923

return found

924

needed = self._expand_offsets(needed)

925

found.update(self._get_and_cache_nodes(needed))

926

return found

927

928

def _get_internal_nodes(self, node_indexes):

929

"""Get a node, from cache or disk.

930

931

After getting it, the node will be cached.

932

"""

933

return self._get_nodes(self._internal_node_cache, node_indexes)

934

935

def _cache_leaf_values(self, nodes):

936

"""Cache directly from key => value, skipping the btree."""

937

if self._leaf_value_cache is not None:

938

for node in nodes.itervalues():

939

for key, value in node.keys.iteritems():

940

if key in self._leaf_value_cache:

941

# Don't add the rest of the keys, we've seen this node

942

# before.

943

break

944

self._leaf_value_cache[key] = value

945

946

def _get_leaf_nodes(self, node_indexes):

947

"""Get a bunch of nodes, from cache or disk."""

948

found = self._get_nodes(self._leaf_node_cache, node_indexes)

949

self._cache_leaf_values(found)

950

return found

951

952

def iter_all_entries(self):
    """Iterate over all keys within the index.

    :return: An iterable of (index, key, value) or
        (index, key, value, reference_lists).
        The former tuple is used when there are no reference lists in the
        index, making the API compatible with simple key:value index types.
        Entries are produced node by node, and in sorted key order within
        each node.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if not self.key_count():
        return
    if self._row_offsets[-1] == 1:
        # There is only the root node, and we read that via key_count()
        nodes = [(0, self._root_node)]
    else:
        first_leaf = self._row_offsets[-2]
        past_last_leaf = self._row_offsets[-1]
        needed_offsets = range(first_leaf, past_last_leaf)
        if needed_offsets == [0]:
            # Special case when we only have a root node, as we have
            # already read everything.
            nodes = [(0, self._root_node)]
        else:
            nodes = self._read_nodes(needed_offsets)
    # We iterate strictly in-order so that we can use this function
    # for spilling index builds to disk.
    with_refs = self.node_ref_lists
    for _, node in nodes:
        for key, (value, refs) in sorted(node.keys.items()):
            if with_refs:
                yield (self, key, value, refs)
            else:
                yield (self, key, value)

994

995

@staticmethod

996

def _multi_bisect_right(in_keys, fixed_keys):

997

"""Find the positions where each 'in_key' would fit in fixed_keys.

998

999

This is equivalent to doing "bisect_right" on each in_key into

1000

fixed_keys

1001

1002

:param in_keys: A sorted list of keys to match with fixed_keys

1003

:param fixed_keys: A sorted list of keys to match against

1004

:return: A list of (integer position, [key list]) tuples.

1005

"""

1006

if not in_keys:

1007

return []

1008

if not fixed_keys:

1009

# no pointers in the fixed_keys list, which means everything must

1010

# fall to the left.

1011

return [(0, in_keys)]

1012

1013

# TODO: Iterating both lists will generally take M + N steps

1014

# Bisecting each key will generally take M * log2 N steps.

1015

# If we had an efficient way to compare, we could pick the method

1016

# based on which has the fewer number of steps.

1017

# There is also the argument that bisect_right is a compiled

1018

# function, so there is even more to be gained.

1019

# iter_steps = len(in_keys) + len(fixed_keys)

1020

# bisect_steps = len(in_keys) * math.log(len(fixed_keys), 2)

1021

if len(in_keys) == 1: # Bisect will always be faster for M = 1

1022

return [(bisect_right(fixed_keys, in_keys[0]), in_keys)]

1023

# elif bisect_steps < iter_steps:

1024

# offsets = {}

1025

# for key in in_keys:

1026

# offsets.setdefault(bisect_right(fixed_keys, key),

1027

# []).append(key)

1028

# return [(o, offsets[o]) for o in sorted(offsets)]

1029

in_keys_iter = iter(in_keys)

1030

fixed_keys_iter = enumerate(fixed_keys)

1031

cur_in_key = in_keys_iter.next()

1032

cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()

1033

1034

class InputDone(Exception): pass

1035

class FixedDone(Exception): pass

1036

1037

output = []

1038

cur_out = []

1039

1040

# TODO: Another possibility is that rather than iterating on each side,

1041

# we could use a combination of bisecting and iterating. For

1042

# example, while cur_in_key < fixed_key, bisect to find its

1043

# point, then iterate all matching keys, then bisect (restricted

1044

# to only the remainder) for the next one, etc.

1045

try:

1046

while True:

1047

if cur_in_key < cur_fixed_key:

1048

cur_keys = []

1049

cur_out = (cur_fixed_offset, cur_keys)

1050

output.append(cur_out)

1051

while cur_in_key < cur_fixed_key:

1052

cur_keys.append(cur_in_key)

1053

try:

1054

cur_in_key = in_keys_iter.next()

1055

except StopIteration:

1056

raise InputDone

1057

# At this point cur_in_key must be >= cur_fixed_key

1058

# step the cur_fixed_key until we pass the cur key, or walk off

1059

# the end

1060

while cur_in_key >= cur_fixed_key:

1061

try:

1062

cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()

1063

except StopIteration:

1064

raise FixedDone

1065

except InputDone:

1066

# We consumed all of the input, nothing more to do

1067

pass

1068

except FixedDone:

1069

# There was some input left, but we consumed all of fixed, so we

1070

# have to add one more for the tail

1071

cur_keys = [cur_in_key]

1072

cur_keys.extend(in_keys_iter)

1073

cur_out = (len(fixed_keys), cur_keys)

1074

output.append(cur_out)

1075

return output

1076

1077

def _walk_through_internal_nodes(self, keys):

1078

"""Take the given set of keys, and find the corresponding LeafNodes.

1079

1080

:param keys: An unsorted iterable of keys to search for

1081

:return: (nodes, index_and_keys)

1082

nodes is a dict mapping {index: LeafNode}

1083

keys_at_index is a list of tuples of [(index, [keys for Leaf])]

1084

"""

1085

# 6 seconds spent in miss_torture using the sorted() line.

1086

# Even with out of order disk IO it seems faster not to sort it when

1087

# large queries are being made.

1088

keys_at_index = [(0, sorted(keys))]

1089

1090

for row_pos, next_row_start in enumerate(self._row_offsets[1:-1]):

1091

node_indexes = [idx for idx, s_keys in keys_at_index]

1092

nodes = self._get_internal_nodes(node_indexes)

1093

1094

next_nodes_and_keys = []

1095

for node_index, sub_keys in keys_at_index:

1096

node = nodes[node_index]

1097

positions = self._multi_bisect_right(sub_keys, node.keys)

1098

node_offset = next_row_start + node.offset

1099

next_nodes_and_keys.extend([(node_offset + pos, s_keys)

1100

for pos, s_keys in positions])

1101

keys_at_index = next_nodes_and_keys

1102

# We should now be at the _LeafNodes

1103

node_indexes = [idx for idx, s_keys in keys_at_index]

1104

1105

# TODO: We may *not* want to always read all the nodes in one

1106

# big go. Consider setting a max size on this.

1107

nodes = self._get_leaf_nodes(node_indexes)

1108

return nodes, keys_at_index

1109

1110

def iter_entries(self, keys):
    """Iterate over keys within the index.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys supplied. No additional keys will be returned, and every
        key supplied that is in the index will be returned.
    """
    # 6 seconds spent in miss_torture using the sorted() line.
    # Even with out of order disk IO it seems faster not to sort it when
    # large queries are being made.
    # However, now that we are doing multi-way bisecting, we need the keys
    # in sorted order anyway. We could change the multi-way code to not
    # require sorted order. (For example, it bisects for the first node,
    # does an in-order search until a key comes before the current point,
    # which it then bisects for, etc.)
    keys = frozenset(keys)
    if not keys:
        return

    if not self.key_count():
        return

    if self._leaf_value_cache is None:
        needed_keys = keys
    else:
        needed_keys = []
        for key in keys:
            value = self._leaf_value_cache.get(key, None)
            if value is not None:
                # Served directly from the leaf value cache; this key does
                # not need to be looked up in the tree.
                value, refs = value
                if self.node_ref_lists:
                    yield (self, key, value, refs)
                else:
                    yield (self, key, value)
            else:
                needed_keys.append(key)

    # needed_keys must not be reset to the full key set here: keys that
    # were already yielded from the value cache would then be looked up
    # in the tree and yielded a second time.
    if not needed_keys:
        return
    nodes, nodes_and_keys = self._walk_through_internal_nodes(needed_keys)
    for node_index, sub_keys in nodes_and_keys:
        if not sub_keys:
            continue
        node = nodes[node_index]
        for next_sub_key in sub_keys:
            if next_sub_key in node.keys:
                value, refs = node.keys[next_sub_key]
                if self.node_ref_lists:
                    yield (self, next_sub_key, value, refs)
                else:
                    yield (self, next_sub_key, value)

1165

1166

def _find_ancestors(self, keys, ref_list_num, parent_map, missing_keys):

1167

"""Find the parent_map information for the set of keys.

1168

1169

This populates the parent_map dict and missing_keys set based on the

1170

queried keys. It also can fill out an arbitrary number of parents that

1171

it finds while searching for the supplied keys.

1172

1173

It is unlikely that you want to call this directly. See

1174

"CombinedGraphIndex.find_ancestry()" for a more appropriate API.

1175

1176

:param keys: A keys whose ancestry we want to return

1177

Every key will either end up in 'parent_map' or 'missing_keys'.

1178

:param ref_list_num: This index in the ref_lists is the parents we

1179

care about.

1180

:param parent_map: {key: parent_keys} for keys that are present in this

1181

index. This may contain more entries than were in 'keys', that are

1182

reachable ancestors of the keys requested.

1183

:param missing_keys: keys which are known to be missing in this index.

1184

This may include parents that were not directly requested, but we

1185

were able to determine that they are not present in this index.

1186

:return: search_keys parents that were found but not queried to know

1187

if they are missing or present. Callers can re-query this index for

1188

those keys, and they will be placed into parent_map or missing_keys

1189

"""

1190

if not self.key_count():

1191

# We use key_count() to trigger reading the root node and

1192

# determining info about this BTreeGraphIndex

1193

# If we don't have any keys, then everything is missing

1194

missing_keys.update(keys)

1195

return set()

1196

if ref_list_num >= self.node_ref_lists:

1197

raise ValueError('No ref list %d, index has %d ref lists'

1198

% (ref_list_num, self.node_ref_lists))

1199

1200

# The main trick we are trying to accomplish is that when we find a

1201

# key listing its parents, we expect that the parent key is also likely

1202

# to sit on the same page. Allowing us to expand parents quickly

1203

# without suffering the full stack of bisecting, etc.

1204

nodes, nodes_and_keys = self._walk_through_internal_nodes(keys)

1205

1206

# These are parent keys which could not be immediately resolved on the

1207

# page where the child was present. Note that we may already be

1208

# searching for that key, and it may actually be present [or known

1209

# missing] on one of the other pages we are reading.

1210

# TODO:

1211

# We could try searching for them in the immediate previous or next

1212

# page. If they occur "later" we could put them in a pending lookup

1213

# set, and then for each node we read thereafter we could check to

1214

# see if they are present.

1215

# However, we don't know the impact of keeping this list of things

1216

# that I'm going to search for every node I come across from here on

1217

# out.

1218

# It doesn't handle the case when the parent key is missing on a

1219

# page that we *don't* read. So we already have to handle being

1220

# re-entrant for that.

1221

# Since most keys contain a date string, they are more likely to be

1222

# found earlier in the file than later, but we would know that right

1223

# away (key < min_key), and wouldn't keep searching it on every other

1224

# page that we read.

1225

# Mostly, it is an idea, one which should be benchmarked.

1226

parents_not_on_page = set()

1227

1228

for node_index, sub_keys in nodes_and_keys:

1229

if not sub_keys:

1230

continue

1231

# sub_keys is all of the keys we are looking for that should exist

1232

# on this page, if they aren't here, then they won't be found

1233

node = nodes[node_index]

1234

node_keys = node.keys

1235

parents_to_check = set()

1236

for next_sub_key in sub_keys:

1237

if next_sub_key not in node_keys:

1238

# This one is just not present in the index at all

1239

missing_keys.add(next_sub_key)

1240

else:

1241

value, refs = node_keys[next_sub_key]

1242

parent_keys = refs[ref_list_num]

1243

parent_map[next_sub_key] = parent_keys

1244

parents_to_check.update(parent_keys)

1245

# Don't look for things we've already found

1246

parents_to_check = parents_to_check.difference(parent_map)

1247

# this can be used to test the benefit of having the check loop

1248

# inlined.

1249

# parents_not_on_page.update(parents_to_check)

1250

# continue

1251

while parents_to_check:

1252

next_parents_to_check = set()

1253

for key in parents_to_check:

1254

if key in node_keys:

1255

value, refs = node_keys[key]

1256

parent_keys = refs[ref_list_num]

1257

parent_map[key] = parent_keys

1258

next_parents_to_check.update(parent_keys)

1259

else:

1260

# This parent either is genuinely missing, or should be

1261

# found on another page. Perf test whether it is better

1262

# to check if this node should fit on this page or not.

1263

# in the 'everything-in-one-pack' scenario, this *not*

1264

# doing the check is 237ms vs 243ms.

1265

# So slightly better, but I assume the standard 'lots

1266

# of packs' is going to show a reasonable improvement

1267

# from the check, because it avoids 'going around

1268

# again' for everything that is in another index

1269

# parents_not_on_page.add(key)

1270

# Missing for some reason

1271

if key < node.min_key:

1272

# in the case of bzr.dev, 3.4k/5.3k misses are

1273

# 'earlier' misses (65%)

1274

parents_not_on_page.add(key)

1275

elif key > node.max_key:

1276

# This parent key would be present on a different

1277

# LeafNode

1278

parents_not_on_page.add(key)

1279

else:

1280

# assert key != node.min_key and key != node.max_key

1281

# If it was going to be present, it would be on

1282

# *this* page, so mark it missing.

1283

missing_keys.add(key)

1284

parents_to_check = next_parents_to_check.difference(parent_map)

1285

# Might want to do another .difference() from missing_keys

1286

# parents_not_on_page could have been found on a different page, or be

1287

# known to be missing. So cull out everything that has already been

1288

# found.

1289

search_keys = parents_not_on_page.difference(

1290

parent_map).difference(missing_keys)

1291

return search_keys

1292

1293

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not to within
    the bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    WARNING: Note that this method currently causes a full index parse
    unconditionally (which is reasonably appropriate as it is a means for
    thunking many small indices into one larger one and still supplies
    iter_all_entries at the thunk layer).

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned.
    :raises errors.BadIndexKey: if a prefix starts with None or does not
        have the index's key length.
    """
    keys = sorted(set(keys))
    if not keys:
        return
    # Load if needed to check key lengths
    if self._key_count is None:
        self._get_root_node()
    # TODO: only access nodes that can satisfy the prefixes we are looking
    # for. For now, to meet API usage (as this function is not used by
    # current bzrlib) just suck the entire index and iterate in memory.
    has_refs = self.node_ref_lists
    nodes = {}
    if self._key_length == 1:
        if has_refs:
            for _, key, value, refs in self.iter_all_entries():
                nodes[key] = value, refs
        else:
            for _, key, value in self.iter_all_entries():
                nodes[key] = value
    else:
        nodes_by_key = {}
        for entry in self.iter_all_entries():
            if has_refs:
                _, key, value, refs = entry
                key_value = key, value, refs
            else:
                _, key, value = entry
                key_value = key, value
            # For a key of (foo, bar, baz) create
            # nodes_by_key[foo][bar][baz] = key_value
            key_dict = nodes_by_key
            for subkey in key[:-1]:
                key_dict = key_dict.setdefault(subkey, {})
            key_dict[key[-1]] = key_value

    if self._key_length == 1:
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            try:
                stored = nodes[key]
            except KeyError:
                continue
            if has_refs:
                value, node_refs = stored
                yield self, key, value, node_refs
            else:
                yield self, key, stored
        return

    for key in keys:
        # sanity check
        if key[0] is None:
            raise errors.BadIndexKey(key)
        if len(key) != self._key_length:
            raise errors.BadIndexKey(key)
        # Descend through the nested dicts for every leading element that
        # is not None, to find the subdict whose contents should be
        # returned.
        key_dict = nodes_by_key
        depth = 0
        key_width = len(key)
        try:
            while depth < key_width and key[depth] is not None:
                key_dict = key_dict[key[depth]]
                depth += 1
        except KeyError:
            # a non-existent lookup.
            continue
        if depth == key_width:
            # the last thing looked up was a terminal element
            yield (self, ) + key_dict
            continue
        pending = [key_dict]
        while pending:
            key_dict = pending.pop(-1)
            # can't be empty or would not exist
            _, sample = key_dict.iteritems().next()
            if type(sample) == dict:
                # push the nested dicts
                pending.extend(key_dict.itervalues())
            else:
                # each value is the key:value:node refs tuple ready to
                # yield.
                for stored in key_dict.itervalues():
                    yield (self, ) + stored

1404

1405

def key_count(self):
    """Return an estimate of the number of keys in this index.

    For BTreeGraphIndex the estimate is exact as it is contained in the
    header. The root node is requested first if the count is not yet
    known.
    """
    if self._key_count is not None:
        return self._key_count
    self._get_root_node()
    return self._key_count

1414

1415

def _compute_row_offsets(self):

1416

"""Fill out the _row_offsets attribute based on _row_lengths."""

1417

offsets = []

1418

row_offset = 0

1419

for row in self._row_lengths:

1420

offsets.append(row_offset)

1421

row_offset += row

1422

offsets.append(row_offset)

1423

self._row_offsets = offsets

1424

1425

def _parse_header_from_bytes(self, bytes):
    """Parse the header from a region of bytes.

    The signature is checked first, then four option lines are read in
    order: node reference list count, key length, key count and row
    lengths. Each value is stored on self, and _row_offsets is derived
    from the row lengths.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data. (which may be of length 0).
    :raises errors.BadIndexFormatSignature: if the signature is wrong.
    :raises errors.BadIndexOptions: if an option line has the wrong prefix
        or a value that is not an integer.
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if not signature == expected_signature:
        raise errors.BadIndexFormatSignature(self._name, BTreeGraphIndex)
    lines = bytes[len(expected_signature):].splitlines()

    def int_option(line, prefix):
        # Strip ``prefix`` from ``line`` and parse the rest as an integer.
        if not line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            return int(line[len(prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = int_option(lines[0], _OPTION_NODE_REFS)
    self._key_length = int_option(lines[1], _OPTION_KEY_ELEMENTS)
    self._key_count = int_option(lines[2], _OPTION_LEN)

    row_line = lines[3]
    if not row_line.startswith(_OPTION_ROW_LENGTHS):
        raise errors.BadIndexOptions(self)
    # Empty fields are skipped before conversion.
    fields = row_line[len(_OPTION_ROW_LENGTHS):].split(',')
    try:
        self._row_lengths = map(int, [field for field in fields
                                      if len(field)])
    except ValueError:
        raise errors.BadIndexOptions(self)
    self._compute_row_offsets()

    # calculate the bytes we have processed: the signature, the four
    # option lines, and one terminator character per option line.
    header_end = len(signature) + sum(map(len, lines[0:4])) + 4
    return header_end, bytes[header_end:]

1471

1472

def _read_nodes(self, nodes):
    """Read some nodes from disk and yield them, parsed.

    This performs a readv to get the node data into memory, and parses each
    node, then yields it to the caller. The nodes are requested in the
    supplied order. If possible doing sort() on the list before requesting
    a read may improve performance.

    When the root node (0) is requested and the file size is not yet known,
    the whole file is fetched instead and every page in it is yielded.

    :param nodes: The nodes to read. 0 - first node, 1 - second node etc.
    :return: A generator of (node_index, node) tuples, where node is a
        _LeafNode or an _InternalNode.
    :raises AssertionError: If a requested node starts past the end of the
        file, or a page does not start with a known node type flag.
    """
    # becomes the byte string of the whole file if we have to fetch it all
    whole_file = None
    # list of (offset, length) regions of the file that should, eventually
    # be read in to data_ranges, either from 'whole_file' or from the
    # transport
    ranges = []
    for index in nodes:
        offset = index * _PAGE_SIZE
        size = _PAGE_SIZE
        if index == 0:
            # Root node - special case
            if self._size:
                size = min(_PAGE_SIZE, self._size)
            else:
                # The only case where we don't know the size, is for very
                # small indexes. So we read the whole thing
                whole_file = self._transport.get_bytes(self._name)
                self._size = len(whole_file)
                # the whole thing should be parsed out of 'whole_file'
                ranges.append((0, len(whole_file)))
                break
        else:
            if offset > self._size:
                raise AssertionError('tried to read past the end'
                                     ' of the file %s > %s'
                                     % (offset, self._size))
            # the last page of the file may be shorter than a full page
            size = min(size, self._size - offset)
        ranges.append((offset, size))
    if not ranges:
        return
    elif whole_file is not None:
        # already have the whole file; cut it into page sized pieces
        data_ranges = [(start, whole_file[start:start + _PAGE_SIZE])
                       for start in range(0, len(whole_file), _PAGE_SIZE)]
    elif self._file is None:
        data_ranges = self._transport.readv(self._name, ranges)
    else:
        data_ranges = []
        for offset, size in ranges:
            self._file.seek(offset)
            data_ranges.append((offset, self._file.read(size)))
    for offset, data in data_ranges:
        if offset == 0:
            # extract the header; offset now points just past it
            offset, data = self._parse_header_from_bytes(data)
            if len(data) == 0:
                continue
        node_bytes = zlib.decompress(data)
        if node_bytes.startswith(_LEAF_FLAG):
            node = _LeafNode(node_bytes, self._key_length,
                             self.node_ref_lists)
        elif node_bytes.startswith(_INTERNAL_FLAG):
            node = _InternalNode(node_bytes)
        else:
            raise AssertionError("Unknown node type for %r" % node_bytes)
        # Floor division: for the root page, offset is the header length
        # rather than a page boundary, and must still map to node 0.
        yield offset // _PAGE_SIZE, node

1537

1538

def _signature(self):
    """Return the signature that files of this index type start with."""
    return _BTSIGNATURE

1541

1542

def validate(self):
    """Check that every node of the index can be read and parsed.

    The root node is fetched first, then every remaining node is pulled
    through _read_nodes and discarded; any failure surfaces as whatever
    exception the read or parse raises.
    """
    self._get_root_node()
    # With a single row there is nothing below the root, so the range
    # built further down is expected to be empty in that case.
    first_node = 1
    if len(self._row_lengths) > 1:
        first_node = self._row_offsets[1]
    end_node = self._row_offsets[-1]
    # Drain the generator purely for its side effect of parsing each node.
    for _unused in self._read_nodes(range(first_node, end_node)):
        pass

1554

1555

1556

try:

1557

from bzrlib import _btree_serializer_pyx as _btree_serializer

1558

except ImportError, e:

1559

osutils.failed_to_load_extension(e)

1560

from bzrlib import _btree_serializer_py as _btree_serializer

Older »