/brz/remove-bazaar : revision 3644.2.10

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/btree_index.py

Committer: John Arbash Meinel
Date: 2008-08-28 20:13:31 UTC
mfrom: (3658 +trunk)
mto: This revision was merged to the branch mainline in revision 3688.
Revision ID: john@arbash-meinel.com-20080828201331-dqffxf54l2heokll

Merge bzr.dev 3658

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_btree_serializer_c.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_walkdirs_win32.h

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chunk_writer.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/helpers.py

bzrlib/tests/repository_implementations/test__generate_text_key_index.py

bzrlib/tests/repository_implementations/test_add_fallback_repository.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_find_text_key_references.py

bzrlib/tests/repository_implementations/test_get_parent_map.py

bzrlib/tests/repository_implementations/test_has_revisions.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_is_write_locked.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/developer-guide/testing.txt

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/index.txt

generate_docs.py

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/package_mf.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/btree_index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""B+Tree indices"""

import array

import bisect

from bisect import bisect_right

from copy import deepcopy

import math

import sha

import struct

import tempfile

import zlib

from bzrlib import (

chunk_writer,

debug,

errors,

index,

lru_cache,

osutils,

trace,

)

from bzrlib.index import _OPTION_NODE_REFS, _OPTION_KEY_ELEMENTS, _OPTION_LEN

from bzrlib.transport import get_transport

# First line of the header of every serialised B+Tree index.
_BTSIGNATURE = "B+Tree Graph Index 2\n"
# Prefix of the header line listing the number of nodes in each row.
_OPTION_ROW_LENGTHS = "row_lengths="
# First line written into every leaf node.
_LEAF_FLAG = "type=leaf\n"
# First line written into every internal node.
_INTERNAL_FLAG = "type=internal\n"
# Prefix of the second line of an internal node; the number that follows is
# the node count of the row below at the time the internal node was opened.
_INTERNAL_OFFSET = "offset="
# Bytes set aside at the start of the first node of each row so that the
# index header can be placed in front of the root node.
_RESERVED_HEADER_BYTES = 120
# Size in bytes of a node on disk.
_PAGE_SIZE = 4096
# Maximum number of leaf nodes kept in the LRU cache.
# 4K per page: 4MB - 1000 entries
_NODE_CACHE_SIZE = 1000

class _BuilderRow(object):

"""The stored state accumulated while writing out a row in the index.

:ivar spool: A temporary file used to accumulate nodes for this row

in the tree.

:ivar nodes: The count of nodes emitted so far.

"""

def __init__(self):

"""Create a _BuilderRow."""

self.nodes = 0

self.spool = tempfile.TemporaryFile()

self.writer = None

def finish_node(self, pad=True):

byte_lines, _, padding = self.writer.finish()

if self.nodes == 0:

# padded note:

self.spool.write("\x00" * _RESERVED_HEADER_BYTES)

skipped_bytes = 0

if not pad and padding:

del byte_lines[-1]

skipped_bytes = padding

self.spool.writelines(byte_lines)

remainder = (self.spool.tell() + skipped_bytes) % _PAGE_SIZE

if remainder != 0:

raise AssertionError("incorrect node length: %d, %d"

% (self.spool.tell(), remainder))

self.nodes += 1

self.writer = None

class _InternalBuilderRow(_BuilderRow):
    """The stored state accumulated while writing out internal rows."""

    def finish_node(self, pad=True):
        """Finish the current internal node; internal nodes are always padded.

        :param pad: Must be true.
        :raises AssertionError: If pad is false.
        """
        if pad:
            _BuilderRow.finish_node(self)
            return
        raise AssertionError("Must pad internal nodes only.")

class _LeafBuilderRow(_BuilderRow):
    """The stored state accumulated while writing out leaf rows."""

100

101

class BTreeBuilder(index.GraphIndexBuilder):

102

"""A Builder for B+Tree based Graph indices.

103

104

The resulting graph has the structure:

105

106

_SIGNATURE OPTIONS NODES

107

_SIGNATURE := 'B+Tree Graph Index 2' NEWLINE

108

OPTIONS := REF_LISTS KEY_ELEMENTS LENGTH ROW_LENGTHS

109

REF_LISTS := 'node_ref_lists=' DIGITS NEWLINE

110

KEY_ELEMENTS := 'key_elements=' DIGITS NEWLINE

111

LENGTH := 'len=' DIGITS NEWLINE

112

ROW_LENGTHS := 'row_lengths=' DIGITS (COMMA DIGITS)* NEWLINE

113

NODES := NODE_COMPRESSED*

114

NODE_COMPRESSED:= COMPRESSED_BYTES{4096}

115

NODE_RAW := INTERNAL | LEAF

116

INTERNAL := INTERNAL_FLAG POINTERS

117

LEAF := LEAF_FLAG ROWS

118

KEY_ELEMENT := Not-whitespace-utf8

119

KEY := KEY_ELEMENT (NULL KEY_ELEMENT)*

120

ROWS := ROW*

121

ROW := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

122

ABSENT := 'a'

123

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

124

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

125

REFERENCE := KEY

126

VALUE := no-newline-no-null-bytes

127

"""

128

129

def __init__(self, reference_lists=0, key_elements=1, spill_at=100000):
    """See GraphIndexBuilder.__init__.

    :param spill_at: Optional parameter controlling the maximum number
        of nodes that BTreeBuilder will hold in memory.
    """
    index.GraphIndexBuilder.__init__(
        self, reference_lists=reference_lists, key_elements=key_elements)
    # None indicates that the by-key-element mapping has not been built yet.
    self._nodes_by_key = None
    # Indices already spilled to disk; unused slots hold None.
    self._backing_indices = []
    self._spill_at = spill_at

141

142

def add_node(self, key, value, references=()):
    """Add a node to the index.

    If adding the node causes the builder to reach its spill_at threshold,
    disk spilling will be triggered.

    :param key: The key. keys are non-empty tuples containing
        as many whitespace-free utf8 bytestrings as the key length
        defined for this index.
    :param value: The value to associate with the key. It may be any
        bytes as long as it does not contain NUL or newline characters.
    :param references: An iterable of iterables of keys. Each is a
        reference to another key.
    :raises errors.BadIndexDuplicateKey: If key is already held in memory.
    """
    # Only the checked references are used; the second element of the
    # result (the absent references) is not needed here.
    node_refs, _ignored = self._check_key_ref_value(key, references, value)
    if key in self._nodes:
        raise errors.BadIndexDuplicateKey(key, self)
    self._nodes[key] = (tuple(node_refs), value)
    self._keys.add(key)
    if self._nodes_by_key is not None and self._key_length > 1:
        # Keep the already-built by-key-element mapping up to date.
        self._update_nodes_by_key(key, value, node_refs)
    if len(self._keys) >= self._spill_at:
        self._spill_mem_keys_to_disk()

167

168

def _spill_mem_keys_to_disk(self):
    """Write the in memory keys down to disk to cap memory consumption.

    If we already have some keys written to disk, we will combine them so
    as to preserve the sorted order. The algorithm for combining uses
    powers of two. So on the first spill, write all mem nodes into a
    single index. On the second spill, combine the mem nodes with the nodes
    on disk to create a 2x sized disk index and get rid of the first index.
    On the third spill, create a single new disk index, which will contain
    the mem nodes, and preserve the existing 2x sized index. On the fourth,
    combine mem with the first and second indexes, creating a new one of
    size 4x. On the fifth create a single new one, etc.
    """
    sources = [self._iter_mem_nodes()]
    # Collect every backing index that precedes the first empty slot.
    # backing_pos ends up as the position of that slot, or as
    # len(self._backing_indices) when every slot is occupied.
    backing_pos = 0
    for backing in self._backing_indices:
        if backing is None:
            break
        sources.append(backing.iter_all_entries())
        backing_pos += 1
    merged = self._iter_smallest(sources)
    new_backing_file, size = self._write_nodes(merged)
    dir_path, base_name = osutils.split(new_backing_file.name)
    # Note: The transport here isn't strictly needed, because we will use
    #       direct access to the new_backing._file object
    new_backing = BTreeGraphIndex(get_transport(dir_path), base_name, size)
    # GC will clean up the file
    new_backing._file = new_backing_file
    if backing_pos == len(self._backing_indices):
        self._backing_indices.append(new_backing)
    else:
        self._backing_indices[backing_pos] = new_backing
    # Everything in the earlier slots has been folded into new_backing.
    self._backing_indices[:backing_pos] = [None] * backing_pos
    self._keys = set()
    self._nodes = {}
    self._nodes_by_key = None

206

207

def add_nodes(self, nodes):
    """Add nodes to the index.

    :param nodes: An iterable of entries to add. Each entry is
        (key, value, node_refs) when the index has reference lists and
        (key, value) otherwise.
    """
    add = self.add_node
    if self.reference_lists:
        for key, value, node_refs in nodes:
            add(key, value, node_refs)
    else:
        for key, value in nodes:
            add(key, value)

218

219

def _iter_mem_nodes(self):

220

"""Iterate over the nodes held in memory."""

221

nodes = self._nodes

222

if self.reference_lists:

223

for key in sorted(nodes):

224

references, value = nodes[key]

225

yield self, key, value, references

226

else:

227

for key in sorted(nodes):

228

references, value = nodes[key]

229

yield self, key, value

230

231

def _iter_smallest(self, iterators_to_combine):

232

if len(iterators_to_combine) == 1:

233

for value in iterators_to_combine[0]:

234

yield value

235

return

236

current_values = []

237

for iterator in iterators_to_combine:

238

try:

239

current_values.append(iterator.next())

240

except StopIteration:

241

current_values.append(None)

242

last = None

243

while True:

244

# Decorate candidates with the value to allow 2.4's min to be used.

245

candidates = [(item[1][1], item) for item

246

in enumerate(current_values) if item[1] is not None]

247

if not len(candidates):

248

return

249

selected = min(candidates)

250

# undecorate back to (pos, node)

251

selected = selected[1]

252

if last == selected[1][1]:

253

raise errors.BadIndexDuplicateKey(last, self)

254

last = selected[1][1]

255

# Yield, with self as the index

256

yield (self,) + selected[1][1:]

257

pos = selected[0]

258

try:

259

current_values[pos] = iterators_to_combine[pos].next()

260

except StopIteration:

261

current_values[pos] = None

262

263

def _add_key(self, string_key, line, rows):
    """Add a key to the current chunk.

    :param string_key: The key to add.
    :param line: The fully serialised key and value.
    :param rows: The builder rows, with the leaf row last. A new row is
        inserted at the front when no existing internal row has room for
        the pointer to a newly started leaf.
    """
    leaf_row = rows[-1]
    if leaf_row.writer is None:
        # Opening a new leaf chunk: flesh out any internal nodes that are
        # needed to preserve the height of the tree.
        for pos, internal_row in enumerate(rows[:-1]):
            if internal_row.writer is not None:
                continue
            length = _PAGE_SIZE
            if internal_row.nodes == 0:
                # The first node of a row leaves room for the header.
                length -= _RESERVED_HEADER_BYTES
            writer = chunk_writer.ChunkWriter(length, 0)
            internal_row.writer = writer
            writer.write(_INTERNAL_FLAG)
            writer.write(_INTERNAL_OFFSET + str(rows[pos + 1].nodes) + "\n")
        # add a new leaf
        length = _PAGE_SIZE
        if leaf_row.nodes == 0:
            length -= _RESERVED_HEADER_BYTES
        leaf_row.writer = chunk_writer.ChunkWriter(length)
        leaf_row.writer.write(_LEAF_FLAG)
    if not leaf_row.writer.write(line):
        return
    # this key did not fit in the node:
    leaf_row.finish_node()
    key_line = string_key + "\n"
    need_new_root = True
    for row in reversed(rows[:-1]):
        # Mark the start of the next node in the node above. If it
        # doesn't fit then propagate upwards until we find one that
        # it does fit into.
        if row.writer.write(key_line):
            row.finish_node()
        else:
            # We've found a node that can handle the pointer.
            need_new_root = False
            break
    # If we reached the current root without being able to mark the
    # division point, then we need a new root:
    if need_new_root:
        if 'index' in debug.debug_flags:
            trace.mutter('Inserting new global row.')
        root_row = _InternalBuilderRow()
        rows.insert(0, root_row)
        # This is the first node of its row, so the reserved header
        # space is taken off the page size.
        root_row.writer = chunk_writer.ChunkWriter(
            _PAGE_SIZE - _RESERVED_HEADER_BYTES, 0)
        root_row.writer.write(_INTERNAL_FLAG)
        root_row.writer.write(_INTERNAL_OFFSET +
                              str(rows[1].nodes - 1) + "\n")
        root_row.writer.write(key_line)
    # Retry the key; it now goes into a freshly opened leaf.
    self._add_key(string_key, line, rows)

321

322

def _write_nodes(self, node_iterator):
    """Write node_iterator out as a B+Tree.

    :param node_iterator: An iterator of sorted nodes. Each node should
        match the output given by iter_all_entries.
    :return: A (file, size) tuple. file is a handle for a temporary file
        containing a B+Tree for the nodes, positioned at its start; size
        is the file position reached after the last write.
    :raises AssertionError: If the header does not fit in the reserved
        space, or if an internal row did not copy the expected number of
        bytes.
    """
    # The index rows - rows[0] is the root, rows[1] is the layer under it
    # etc.
    rows = []
    # forward sorted by key. In future we may consider topological sorting,
    # at the cost of table scans for direct lookup, or a second index for
    # direct lookup
    key_count = 0
    # A stack with the number of nodes of each size. 0 is the root node
    # and must always be 1 (if there are any nodes in the tree).
    # NOTE(review): this attribute is only reset here; the header below is
    # built from a local list instead.
    self.row_lengths = []
    # Loop over all nodes adding them to the bottom row
    # (rows[-1]). When we finish a chunk in a row,
    # propagate the key that didn't fit (comes after the chunk) to the
    # row above, transitively.
    for node in node_iterator:
        if key_count == 0:
            # First key triggers the first row
            rows.append(_LeafBuilderRow())
        key_count += 1
        # TODO: Flattening the node into a string key and a line should
        #       probably be put into a pyrex function. We can do a quick
        #       iter over all the entries to determine the final length,
        #       and then do a single malloc() rather than lots of
        #       intermediate mallocs as we build everything up.
        #       ATM 3 / 13s are spent flattening nodes (10s is compressing)
        string_key, line = _btree_serializer._flatten_node(
            node, self.reference_lists)
        self._add_key(string_key, line, rows)
    # Close the node still open in each row; only leaf rows may skip the
    # trailing padding.
    for row in reversed(rows):
        pad = (type(row) != _LeafBuilderRow)
        row.finish_node(pad=pad)
    result = tempfile.NamedTemporaryFile()
    lines = [_BTSIGNATURE]
    lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
    lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
    lines.append(_OPTION_LEN + str(key_count) + '\n')
    row_lengths = [row.nodes for row in rows]
    lines.append(_OPTION_ROW_LENGTHS + ','.join(map(str, row_lengths)) + '\n')
    result.writelines(lines)
    position = sum(map(len, lines))
    if position > _RESERVED_HEADER_BYTES:
        raise AssertionError("Could not fit the header in the"
                             " reserved space: %d > %d"
                             % (position, _RESERVED_HEADER_BYTES))
    # reserved space for the first node of every row
    reserved = _RESERVED_HEADER_BYTES
    # write the rows out:
    for row in rows:
        row.spool.flush()
        row.spool.seek(0)
        # copy nodes to the finalised file.
        # Special case the first node as it may be prefixed
        node = row.spool.read(_PAGE_SIZE)
        result.write(node[reserved:])
        result.write("\x00" * (reserved - position))
        position = 0 # Only the root row actually has an offset
        copied_len = osutils.pumpfile(row.spool, result)
        if copied_len != (row.nodes - 1) * _PAGE_SIZE:
            # A leaf row may be short because its last node is unpadded.
            if type(row) != _LeafBuilderRow:
                raise AssertionError("Incorrect amount of data copied"
                                     " expected: %d, got: %d"
                                     % ((row.nodes - 1) * _PAGE_SIZE,
                                        copied_len))
    result.flush()
    size = result.tell()
    result.seek(0)
    return result, size

397

398

def finish(self):
    """Finalise the index.

    :return: A file handle for a temporary file containing the nodes added
        to the index.
    """
    entries = self.iter_all_entries()
    written = self._write_nodes(entries)
    # _write_nodes also reports the size; only the file is handed back.
    return written[0]

405

406

def iter_all_entries(self):
    """Iterate over all keys within the index.

    :return: An iterable of (index, key, value) or
        (index, key, value, reference_lists) entries, the latter when the
        index has reference lists. The in-memory nodes and the entries of
        every backing index are combined through _iter_smallest.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    # Doing serial rather than ordered would be faster; but this shouldn't
    # be getting called routinely anyway.
    iterators = [self._iter_mem_nodes()]
    iterators.extend([backing.iter_all_entries()
                      for backing in self._backing_indices
                      if backing is not None])
    if len(iterators) > 1:
        return self._iter_smallest(iterators)
    return iterators[0]

425

426

def iter_entries(self, keys):
    """Iterate over keys within the index.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable of (index, key, value) or
        (index, key, value, reference_lists) entries, the latter when the
        index has reference lists. There is no defined order for the
        result iteration: keys held in memory come first, followed by
        those found in each backing index.
    """
    keys = set(keys)
    with_refs = self.reference_lists
    for key in keys.intersection(self._keys):
        references, value = self._nodes[key]
        if with_refs:
            yield self, key, value, references
        else:
            yield self, key, value
    # Whatever was not held in memory may still live in a backing index.
    keys.difference_update(self._keys)
    for backing in self._backing_indices:
        if backing is None:
            continue
        if not keys:
            return
        for node in backing.iter_entries(keys):
            keys.remove(node[1])
            yield (self,) + node[1:]

452

453

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not to within
    the bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned.
    :raises errors.BadIndexKey: If a prefix starts with None or has the
        wrong length.
    """
    # XXX: Too much duplication with the GraphIndex class; consider finding
    # a good place to pull out the actual common logic.
    keys = set(keys)
    if not keys:
        return
    for backing in self._backing_indices:
        if backing is None:
            continue
        for node in backing.iter_entries_prefix(keys):
            # TODO: We should probably remove yielded keys from the keys
            # list
            yield (self,) + node[1:]
    if self._key_length == 1:
        # With single-element keys a prefix is simply a complete key.
        for key in keys:
            # sanity check
            if key[0] is None or len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            try:
                node = self._nodes[key]
            except KeyError:
                continue
            if self.reference_lists:
                yield self, key, node[1], node[0]
            else:
                yield self, key, node[1]
        return
    for key in keys:
        # sanity check
        if key[0] is None or len(key) != self._key_length:
            raise errors.BadIndexKey(key)
        # Walk down the nested dicts for as long as the prefix supplies
        # real elements.
        subtree = self._get_nodes_by_key()
        depth = 0
        try:
            while depth < len(key) and key[depth] is not None:
                subtree = subtree[key[depth]]
                depth += 1
        except KeyError:
            # a non-existent lookup.
            continue
        if depth == len(key):
            # Every element was given, so subtree is the entry itself.
            yield (self, ) + subtree
            continue
        pending = [subtree]
        while pending:
            subtree = pending.pop(-1)
            # can't be empty or would not exist
            item, value = subtree.iteritems().next()
            if type(value) == dict:
                # push the nested dicts
                pending.extend(subtree.itervalues())
            else:
                # yield the entries
                for value in subtree.itervalues():
                    yield (self, ) + value

530

531

def _get_nodes_by_key(self):

532

if self._nodes_by_key is None:

533

nodes_by_key = {}

534

if self.reference_lists:

535

for key, (references, value) in self._nodes.iteritems():

536

key_dict = nodes_by_key

537

for subkey in key[:-1]:

538

key_dict = key_dict.setdefault(subkey, {})

539

key_dict[key[-1]] = key, value, references

540

else:

541

for key, (references, value) in self._nodes.iteritems():

542

key_dict = nodes_by_key

543

for subkey in key[:-1]:

544

key_dict = key_dict.setdefault(subkey, {})

545

key_dict[key[-1]] = key, value

546

self._nodes_by_key = nodes_by_key

547

return self._nodes_by_key

548

549

def key_count(self):
    """Return an estimate of the number of keys in this index.

    The result is the number of keys held in memory plus the key_count()
    of every backing index.
    """
    total = len(self._keys)
    for backing in self._backing_indices:
        if backing is not None:
            total += backing.key_count()
    return total

556

557

def validate(self):
    """In-memory indices have no known corruption at the moment."""
    return None

559

560

561

class _LeafNode(object):
    """A leaf node for a serialised B+Tree index."""

    def __init__(self, bytes, key_length, ref_list_length):
        """Parse bytes to create a leaf node object.

        :param bytes: The serialised content of the leaf node.
        :param key_length: Passed through to the leaf line parser.
        :param ref_list_length: Passed through to the leaf line parser.
        """
        # splitlines mangles the \r delimiters.. don't use it.
        parsed = _btree_serializer._parse_leaf_lines(
            bytes, key_length, ref_list_length)
        self.keys = dict(parsed)

569

570

571

class _InternalNode(object):

572

"""An internal node for a serialised B+Tree index."""

573

574

def __init__(self, bytes):

575

"""Parse bytes to create an internal node object."""

576

# splitlines mangles the \r delimiters.. don't use it.

577

self.keys = self._parse_lines(bytes.split('\n'))

578

579

def _parse_lines(self, lines):

580

nodes = []

581

self.offset = int(lines[1][7:])

582

for line in lines[2:]:

583

if line == '':

584

break

585

nodes.append(tuple(line.split('\0')))

586

return nodes

587

588

589

class BTreeGraphIndex(object):

590

"""Access to nodes via the standard GraphIndex interface for B+Tree's.

591

592

Individual nodes are held in a LRU cache. This holds the root node in

593

memory except when very large walks are done.

594

"""

595

596

def __init__(self, transport, name, size):
    """Create a B+Tree index object on the index name.

    :param transport: The transport to read data for the index from.
    :param name: The file name of the index on transport.
    :param size: The size of the index in bytes. This allows
        compatibility with the GraphIndex API, as well as ensuring that
        the initial read (to read the root node header) can be done
        without over-reading even on empty indices, and on small indices
        allows single-IO to read the entire index.
    """
    # Where the index lives.
    self._transport = transport
    self._name = name
    self._size = size
    self._file = None
    self._page_size = transport.recommended_page_size()
    # Header state; nothing has been read yet.
    self._root_node = None
    self._key_count = None
    self._row_lengths = None
    self._row_offsets = None # Start of each row, [-1] is the end
    # Node caches. The leaf value cache is currently switched off; its
    # intended default max size is 100,000 leaf values.
    self._leaf_value_cache = None # lru_cache.LRUCache(100*1000)
    self._leaf_node_cache = lru_cache.LRUCache(_NODE_CACHE_SIZE)
    self._internal_node_cache = lru_cache.LRUCache()

620

621

def __eq__(self, other):

622

"""Equal when self and other were created with the same parameters."""

623

return (

624

type(self) == type(other) and

625

self._transport == other._transport and

626

self._name == other._name and

627

self._size == other._size)

628

629

def __ne__(self, other):

630

return not self.__eq__(other)

631

632

def _get_root_node(self):

633

if self._root_node is None:

634

# We may not have a root node yet

635

nodes = list(self._read_nodes([0]))

636

if len(nodes):

637

self._root_node = nodes[0][1]

638

return self._root_node

639

640

def _cache_nodes(self, nodes, cache):

641

"""Read nodes and cache them in the lru.

642

643

The nodes list supplied is sorted and then read from disk, each node

644

being inserted it into the _node_cache.

645

646

Note: Asking for more nodes than the _node_cache can contain will

647

result in some of the results being immediately discarded, to prevent

648

this an assertion is raised if more nodes are asked for than are

649

cachable.

650

651

:return: A dict of {node_pos: node}

652

"""

653

if len(nodes) > cache._max_cache:

654

trace.mutter('Requesting %s > %s nodes, not all will be cached',

655

len(nodes), cache._max_cache)

656

found = {}

657

for node_pos, node in self._read_nodes(sorted(nodes)):

658

if node_pos == 0: # Special case

659

self._root_node = node

660

else:

661

cache.add(node_pos, node)

662

found[node_pos] = node

663

return found

664

665

def _get_nodes(self, cache, node_indexes):

666

found = {}

667

needed = []

668

for idx in node_indexes:

669

if idx == 0 and self._root_node is not None:

670

found[0] = self._root_node

671

continue

672

try:

673

found[idx] = cache[idx]

674

except KeyError:

675

needed.append(idx)

676

found.update(self._cache_nodes(needed, cache))

677

return found

678

679

def _get_internal_nodes(self, node_indexes):

680

"""Get a node, from cache or disk.

681

682

After getting it, the node will be cached.

683

"""

684

return self._get_nodes(self._internal_node_cache, node_indexes)

685

686

def _get_leaf_nodes(self, node_indexes):

687

"""Get a bunch of nodes, from cache or disk."""

688

found = self._get_nodes(self._leaf_node_cache, node_indexes)

689

if self._leaf_value_cache is not None:

690

for node in found.itervalues():

691

for key, value in node.keys.iteritems():

692

if key in self._leaf_value_cache:

693

# Don't add the rest of the keys, we've seen this node

694

# before.

695

break

696

self._leaf_value_cache[key] = value

697

return found

698

699

def iter_all_entries(self):
    """Iterate over all keys within the index.

    :return: An iterable of (index, key, value) or
        (index, key, value, reference_lists). The former tuple is used
        when there are no reference lists in the index, making the API
        compatible with simple key:value index types. Leaf nodes are read
        in position order and the keys of each node are yielded sorted.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if not self.key_count():
        return
    # The last row holds the leaves; _row_offsets[-1] marks its end.
    first_leaf = self._row_offsets[-2]
    past_last_leaf = self._row_offsets[-1]
    leaf_positions = range(first_leaf, past_last_leaf)
    with_refs = self.node_ref_lists
    # We iterate strictly in-order so that we can use this function
    # for spilling index builds to disk.
    for _, node in self._read_nodes(leaf_positions):
        for key, (value, refs) in sorted(node.keys.items()):
            if with_refs:
                yield (self, key, value, refs)
            else:
                yield (self, key, value)

726

727

@staticmethod

728

def _multi_bisect_right(in_keys, fixed_keys):

729

"""Find the positions where each 'in_key' would fit in fixed_keys.

730

731

This is equivalent to doing "bisect_right" on each in_key into

732

fixed_keys

733

734

:param in_keys: A sorted list of keys to match with fixed_keys

735

:param fixed_keys: A sorted list of keys to match against

736

:return: A list of (integer position, [key list]) tuples.

737

"""

738

if not in_keys:

739

return []

740

if not fixed_keys:

741

# no pointers in the fixed_keys list, which means everything must

742

# fall to the left.

743

return [(0, in_keys)]

744

745

# TODO: Iterating both lists will generally take M + N steps

746

# Bisecting each key will generally take M * log2 N steps.

747

# If we had an efficient way to compare, we could pick the method

748

# based on which has the fewer number of steps.

749

# There is also the argument that bisect_right is a compiled

750

# function, so there is even more to be gained.

751

# iter_steps = len(in_keys) + len(fixed_keys)

752

# bisect_steps = len(in_keys) * math.log(len(fixed_keys), 2)

753

if len(in_keys) == 1: # Bisect will always be faster for M = 1

754

return [(bisect_right(fixed_keys, in_keys[0]), in_keys)]

755

# elif bisect_steps < iter_steps:

756

# offsets = {}

757

# for key in in_keys:

758

# offsets.setdefault(bisect_right(fixed_keys, key),

759

# []).append(key)

760

# return [(o, offsets[o]) for o in sorted(offsets)]

761

in_keys_iter = iter(in_keys)

762

fixed_keys_iter = enumerate(fixed_keys)

763

cur_in_key = in_keys_iter.next()

764

cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()

765

766

class InputDone(Exception): pass

767

class FixedDone(Exception): pass

768

769

output = []

770

cur_out = []

771

772

# TODO: Another possibility is that rather than iterating on each side,

773

# we could use a combination of bisecting and iterating. For

774

# example, while cur_in_key < fixed_key, bisect to find its

775

# point, then iterate all matching keys, then bisect (restricted

776

# to only the remainder) for the next one, etc.

777

try:

778

while True:

779

if cur_in_key < cur_fixed_key:

780

cur_keys = []

781

cur_out = (cur_fixed_offset, cur_keys)

782

output.append(cur_out)

783

while cur_in_key < cur_fixed_key:

784

cur_keys.append(cur_in_key)

785

try:

786

cur_in_key = in_keys_iter.next()

787

except StopIteration:

788

raise InputDone

789

# At this point cur_in_key must be >= cur_fixed_key

790

# step the cur_fixed_key until we pass the cur key, or walk off

791

# the end

792

while cur_in_key >= cur_fixed_key:

793

try:

794

cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()

795

except StopIteration:

796

raise FixedDone

797

except InputDone:

798

# We consumed all of the input, nothing more to do

799

pass

800

except FixedDone:

801

# There was some input left, but we consumed all of fixed, so we

802

# have to add one more for the tail

803

cur_keys = [cur_in_key]

804

cur_keys.extend(in_keys_iter)

805

cur_out = (len(fixed_keys), cur_keys)

806

output.append(cur_out)

807

return output

808

809

def iter_entries(self, keys):
    """Iterate over keys within the index.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys supplied. No additional keys will be returned, and every
        key supplied that is in the index will be returned.
    """
    # 6 seconds spent in miss_torture using the sorted() line.
    # Even with out of order disk IO it seems faster not to sort it when
    # large queries are being made.
    # However, now that we are doing multi-way bisecting, we need the keys
    # in sorted order anyway. We could change the multi-way code to not
    # require sorted order. (For example, it bisects for the first node,
    # does an in-order search until a key comes before the current point,
    # which it then bisects for, etc.)
    keys = frozenset(keys)
    if not keys:
        return

    if not self.key_count():
        return

    if self._leaf_value_cache is None:
        needed_keys = keys
    else:
        # Answer what we can from the leaf value cache; only the keys it
        # does not hold are searched for in the tree, so that no key is
        # yielded twice.
        needed_keys = []
        for key in keys:
            cached = self._leaf_value_cache.get(key, None)
            if cached is None:
                needed_keys.append(key)
                continue
            value, refs = cached
            if self.node_ref_lists:
                yield (self, key, value, refs)
            else:
                yield (self, key, value)

    if not needed_keys:
        return
    needed_keys = sorted(needed_keys)

    # Start with every key assigned to the root node and push the keys
    # down one row at a time.
    nodes_and_keys = [(0, needed_keys)]

    for next_row_start in self._row_offsets[1:-1]:
        node_indexes = [idx for idx, s_keys in nodes_and_keys]
        nodes = self._get_internal_nodes(node_indexes)

        next_nodes_and_keys = []
        for node_index, sub_keys in nodes_and_keys:
            node = nodes[node_index]
            positions = self._multi_bisect_right(sub_keys, node.keys)
            # Child positions are relative to node.offset within the
            # next row.
            node_offset = next_row_start + node.offset
            next_nodes_and_keys.extend([(node_offset + pos, s_keys)
                                       for pos, s_keys in positions])
        nodes_and_keys = next_nodes_and_keys
    # We should now be at the _LeafNodes
    node_indexes = [idx for idx, s_keys in nodes_and_keys]

    # TODO: We may *not* want to always read all the nodes in one
    #       big go. Consider setting a max size on this.

    nodes = self._get_leaf_nodes(node_indexes)
    for node_index, sub_keys in nodes_and_keys:
        if not sub_keys:
            continue
        node = nodes[node_index]
        for next_sub_key in sub_keys:
            if next_sub_key in node.keys:
                value, refs = node.keys[next_sub_key]
                if self.node_ref_lists:
                    yield (self, next_sub_key, value, refs)
                else:
                    yield (self, next_sub_key, value)

889

890

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not to within
    the bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    WARNING: Note that this method currently causes a full index parse
    unconditionally (which is reasonably appropriate as it is a means for
    thunking many small indices into one larger one and still supplies
    iter_all_entries at the thunk layer).

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned.
    :raises BadIndexKey: When a supplied prefix does not have exactly
        self._key_length elements, or its first element is None. The
        error is raised lazily, when iteration reaches the bad prefix.
    """
    keys = sorted(set(keys))
    if not keys:
        return
    # Load if needed to check key lengths
    if self._key_count is None:
        self._get_root_node()
    key_length = self._key_length
    # TODO: only access nodes that can satisfy the prefixes we are looking
    #       for. For now, to meet API usage (as this function is not used by
    #       current bzrlib) just suck the entire index and iterate in memory.
    #
    # For a key of (foo, bar, baz) create
    #   nodes_by_key[foo][bar][baz] = (key, value[, refs])
    # The stored tuple is simply the entry minus its leading index object,
    # so the same code serves indices with and without reference lists, and
    # single-element keys are just the depth-one case of the same layout.
    nodes_by_key = {}
    for entry in self.iter_all_entries():
        key = entry[1]
        key_dict = nodes_by_key
        for subkey in key[:-1]:
            key_dict = key_dict.setdefault(subkey, {})
        key_dict[key[-1]] = tuple(entry[1:])
    for key in keys:
        # sanity check; the length is tested first so that an empty tuple
        # is reported as a bad key rather than failing on key[0].
        if len(key) != key_length or key[0] is None:
            raise errors.BadIndexKey(key)
        # find the subdict (or terminal entry) the prefix refers to.
        key_dict = nodes_by_key
        depth = 0
        try:
            while depth < key_length and key[depth] is not None:
                key_dict = key_dict[key[depth]]
                depth += 1
        except KeyError:
            # a non-existent lookup.
            continue
        if depth == key_length:
            # every element was given: the last thing looked up was a
            # terminal (key, value[, refs]) tuple.
            yield (self, ) + key_dict
            continue
        # A true prefix: walk everything below the subdict we reached.
        pending = [key_dict]
        while pending:
            key_dict = pending.pop()
            for value in key_dict.values():
                if isinstance(value, dict):
                    # an intermediate level, descend into it later
                    pending.append(value)
                else:
                    # each value is the key:value:node refs tuple
                    # ready to yield.
                    yield (self, ) + value

1001

1002

def key_count(self):
    """Report how many keys this index holds.

    The API describes the result as an estimate, but for BTreeGraphIndex
    the figure is exact because it is recorded in the index header. If the
    count has not been loaded yet, the root node is fetched first.
    """
    if self._key_count is not None:
        return self._key_count
    # Not known yet: fetching the root node is expected to fill it in.
    self._get_root_node()
    return self._key_count

1011

1012

def _parse_header_from_bytes(self, bytes):
    """Parse the header from a region of bytes.

    The header is the format signature followed by four option lines.
    Their integer values are stored on self.node_ref_lists,
    self._key_length and self._key_count; the fourth line is a
    comma-separated list stored on self._row_lengths, from which the
    cumulative self._row_offsets is derived.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data. (which may be of length 0).
    :raises BadIndexFormatSignature: When the data does not start with
        the signature returned by self._signature().
    :raises BadIndexOptions: When an option line is missing, does not
        start with its expected prefix, or does not hold integer data.
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if signature != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, BTreeGraphIndex)
    lines = bytes[len(expected_signature):].splitlines()
    if len(lines) < 4:
        # A truncated header is a malformed index, not an IndexError.
        raise errors.BadIndexOptions(self)

    def option_text(line, prefix):
        # Return the text following prefix, rejecting any other line.
        if not line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        return line[len(prefix):]

    def int_option(line, prefix):
        # Return the integer following prefix on line.
        text = option_text(line, prefix)
        try:
            return int(text)
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = int_option(lines[0], _OPTION_NODE_REFS)
    self._key_length = int_option(lines[1], _OPTION_KEY_ELEMENTS)
    self._key_count = int_option(lines[2], _OPTION_LEN)
    row_text = option_text(lines[3], _OPTION_ROW_LENGTHS)
    try:
        # A real list (not a lazy map object) because the row lengths are
        # iterated here and measured with len() elsewhere.
        self._row_lengths = [int(length) for length in row_text.split(',')
                             if length]
    except ValueError:
        raise errors.BadIndexOptions(self)
    # _row_offsets[i] is the index of the first node of row i; the final
    # entry is the total number of nodes.
    offsets = []
    row_offset = 0
    for row in self._row_lengths:
        offsets.append(row_offset)
        row_offset += row
    offsets.append(row_offset)
    self._row_offsets = offsets

    # calculate the bytes we have processed: splitlines() dropped the line
    # terminators, so add one byte back for each of the four option lines
    # (this assumes single-byte terminators).
    header_end = len(signature) + sum(map(len, lines[0:4])) + 4
    return header_end, bytes[header_end:]

1064

1065

def _read_nodes(self, nodes):
    """Read some nodes from disk and yield them parsed.

    This fetches the node data into memory (with a readv on the transport,
    or seek/read on self._file when that is set), parses each node, then
    yields it to the caller. The nodes are requested in the supplied
    order. If possible doing sort() on the list before requesting a read
    may improve performance.

    :param nodes: The nodes to read. 0 - first node, 1 - second node etc.
    :return: A generator of (node_index, node) tuples, where node is a
        _LeafNode or an _InternalNode. A root page that holds nothing
        after its header yields no entry.
    :raises AssertionError: When a decompressed node starts with neither
        the leaf nor the internal node flag.
    """
    ranges = []
    for index in nodes:
        offset = index * _PAGE_SIZE
        size = _PAGE_SIZE
        if index == 0:
            # Root node - special case
            if not self._size:
                stream = self._transport.get(self._name)
                try:
                    start = stream.read(_PAGE_SIZE)
                finally:
                    # Do not leak the transport's file handle.
                    stream.close()
                # Avoid doing this again
                # NOTE(review): only the first page is measured here, so
                # an index longer than _PAGE_SIZE would be recorded as
                # _PAGE_SIZE bytes -- confirm that callers always supply
                # the size for multi-page indices.
                self._size = len(start)
            size = min(_PAGE_SIZE, self._size)
        else:
            # The final page of the file may be short.
            size = min(size, self._size - offset)
        ranges.append((offset, size))
    if not ranges:
        return
    if self._file is None:
        data_ranges = self._transport.readv(self._name, ranges)
    else:
        data_ranges = []
        for offset, size in ranges:
            self._file.seek(offset)
            data_ranges.append((offset, self._file.read(size)))
    for offset, data in data_ranges:
        if offset == 0:
            # extract the header; offset becomes the header length, which
            # still floor-divides to node 0 below.
            offset, data = self._parse_header_from_bytes(data)
            if len(data) == 0:
                continue
        node_bytes = zlib.decompress(data)
        if node_bytes.startswith(_LEAF_FLAG):
            node = _LeafNode(node_bytes, self._key_length,
                             self.node_ref_lists)
        elif node_bytes.startswith(_INTERNAL_FLAG):
            node = _InternalNode(node_bytes)
        else:
            raise AssertionError("Unknown node type for %r" % node_bytes)
        # Explicit floor division: the node index must stay an integer.
        yield offset // _PAGE_SIZE, node

1116

1117

def _signature(self):
    """Return the signature bytes that open a file of this index type."""
    return _BTSIGNATURE

1120

1121

def validate(self):
    """Check that every node of the index can be read and parsed."""
    # Load the root first; the row layout consulted below is expected to
    # be available once this returns.
    self._get_root_node()
    # With a single row we shouldn't be reading anything anyway, so start
    # just past the root unless there is a second row to begin from.
    first_node = 1
    if len(self._row_lengths) > 1:
        first_node = self._row_offsets[1]
    end_node = self._row_offsets[-1]
    # Draining the generator is what actually reads and parses each node.
    for _unused in self._read_nodes(range(first_node, end_node)):
        pass

1133

1134

1135

try:

1136

from bzrlib import _btree_serializer_c as _btree_serializer

1137

except ImportError:

1138

from bzrlib import _btree_serializer_py as _btree_serializer

Older »