/brz/remove-bazaar : revision 4168.3.6

To get this branch, use:

bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: John Arbash Meinel
Date: 2009-03-23 19:35:38 UTC
mto: This revision was merged to the branch mainline in revision 4187.
Revision ID: john@arbash-meinel.com-20090323193538-3d01aetz07jsyd3w

Add 'combine_backing_indices' as a flag for GraphIndex.set_optimize().

Update the Packer code so that it sets combine_backing_indices=False, as we know that
we won't be making extra queries.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_btree_serializer_c.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_create_clone.py

bzrlib/tests/branch_implementations/test_dotted_revno_to_revision_id.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_iter_merge_sorted_revisions.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_dotted_revno.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_views.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2-windows.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/index.txt

doc/news-template.txt

generate_docs.py

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/build_release.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

# Names exported by ``from bzrlib.index import *``; helpers and constants
# whose names start with an underscore are intentionally left out.
__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

symbol_versioning,

)

# (offset, length) range handed to _read_and_parse when the header is needed.
_HEADER_READV = (0, 200)

# Prefixes of the three option lines written after the signature by
# GraphIndexBuilder.finish and checked again when a header is parsed.
_OPTION_KEY_ELEMENTS = "key_elements="

_OPTION_LEN = "len="

_OPTION_NODE_REFS = "node_ref_lists="

# First line written by GraphIndexBuilder.finish.
_SIGNATURE = "Bazaar Graph Index 1\n"

# Matches any character that _check_key refuses inside a key element.
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

# Matches the characters that are refused inside a node value.
_newline_null_re = re.compile('[\n\0]')

def _has_key_from_parent_map(self, key):

"""Check if this index has one key.

If it's possible to check for multiple keys at once through

calling get_parent_map that should be faster.

"""

return (key in self.get_parent_map([key]))

def _missing_keys_from_parent_map(self, keys):

return set(keys) - set(self.get_parent_map(keys))

class GraphIndexBuilder(object):
    """A builder that can build a GraphIndex.

    The resulting graph has the structure:

    _SIGNATURE OPTIONS NODES NEWLINE
    _SIGNATURE     := 'Bazaar Graph Index 1' NEWLINE
    OPTIONS        := 'node_ref_lists=' DIGITS NEWLINE
                      'key_elements=' DIGITS NEWLINE
                      'len=' DIGITS NEWLINE
    NODES          := NODE*
    NODE           := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE
    KEY            := Not-whitespace-utf8
    ABSENT         := 'a'
    REFERENCES     := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}
    REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?
    REFERENCE      := DIGITS  ; digits is the byte offset in the index of the
                              ; referenced key.
    VALUE          := no-newline-no-null-bytes
    """

    def __init__(self, reference_lists=0, key_elements=1):
        """Create a GraphIndex builder.

        :param reference_lists: The number of node references lists for each
            entry.
        :param key_elements: The number of bytestrings in each key.
        """
        self.reference_lists = reference_lists
        self._key_length = key_elements
        # Keys added through add_node (absent placeholders are not included).
        self._keys = set()
        # A dict of {key: (absent, ref_lists, value)}
        self._nodes = {}
        # Nested-dict view of _nodes, built lazily by _get_nodes_by_key.
        self._nodes_by_key = None
        self._optimize_for_size = False
        self._combine_backing_indices = True

    def _check_key(self, key):
        """Raise BadIndexKey if key is not a valid key for this index."""
        if type(key) != tuple or self._key_length != len(key):
            raise errors.BadIndexKey(key)
        for element in key:
            if not element or _whitespace_re.search(element) is not None:
                raise errors.BadIndexKey(element)

    def _external_references(self):
        """Return references that are not present in this index.

        Relies on self.iter_all_entries(), which is not defined on this
        class in the visible code (presumably supplied by a subclass).

        :return: A set of keys found in the second reference list of some
            node but not stored as a node themselves; an empty set when the
            index has fewer than two reference lists.
        """
        # TODO: JAM 2008-11-21 This makes an assumption about how the reference
        #       lists are used. It is currently correct for pack-0.92 through
        #       1.9, which use the node references (3rd column) second
        #       reference list as the compression parent. Perhaps this should
        #       be moved into something higher up the stack, since it
        #       makes assumptions about how the index is used.
        if self.reference_lists <= 1:
            # If reference_lists == 0 there can be no external references, and
            # if reference_lists == 1, then there isn't a place to store the
            # compression parent
            return set()
        keys = set()
        refs = set()
        for node in self.iter_all_entries():
            keys.add(node[1])
            refs.update(node[3][1])
        return refs - keys

    def _get_nodes_by_key(self):
        """Return the nested-dict view of the nodes, building it on demand.

        For a key (foo, bar, baz) the view holds
        view[foo][bar][baz] = (key, value, references) when the index has
        reference lists, otherwise (key, value).  Absent nodes are skipped.
        """
        if self._nodes_by_key is None:
            nodes_by_key = {}
            with_references = bool(self.reference_lists)
            for key, (absent, references, value) in self._nodes.iteritems():
                if absent:
                    continue
                key_dict = nodes_by_key
                for subkey in key[:-1]:
                    key_dict = key_dict.setdefault(subkey, {})
                if with_references:
                    key_dict[key[-1]] = key, value, references
                else:
                    key_dict[key[-1]] = key, value
            self._nodes_by_key = nodes_by_key
        return self._nodes_by_key

    def _update_nodes_by_key(self, key, value, node_refs):
        """Update the _nodes_by_key dict with a new key.

        For a key of (foo, bar, baz) create
        _nodes_by_key[foo][bar][baz] = key_value

        Does nothing when the nested view has not been built yet.
        """
        if self._nodes_by_key is None:
            return
        key_dict = self._nodes_by_key
        if self.reference_lists:
            key_value = key, value, node_refs
        else:
            key_value = key, value
        for subkey in key[:-1]:
            key_dict = key_dict.setdefault(subkey, {})
        key_dict[key[-1]] = key_value

    def _check_key_ref_value(self, key, references, value):
        """Check that 'key' and 'references' are all valid.

        :param key: A key tuple. Must conform to the key interface (be a tuple,
            be of the right length, not have any whitespace or nulls in any key
            element.)
        :param references: An iterable of reference lists. Something like
            [[(ref, key)], [(ref, key), (other, key)]]
        :param value: The value associate with this key. Must not contain
            newlines or null characters.
        :return: (node_refs, absent_references)
            node_refs   basically a packed form of 'references' where all
                        iterables are tuples
            absent_references   reference keys that are not in self._nodes.
                                This may contain duplicates if the same key is
                                referenced in multiple lists.
        :raises BadIndexKey: if key or a not-yet-known reference is invalid.
        :raises BadIndexValue: if value contains a newline or null, or the
            number of reference lists does not match self.reference_lists.
        """
        self._check_key(key)
        if _newline_null_re.search(value) is not None:
            raise errors.BadIndexValue(value)
        if len(references) != self.reference_lists:
            raise errors.BadIndexValue(references)
        node_refs = []
        absent_references = []
        for reference_list in references:
            for reference in reference_list:
                # If reference *is* in self._nodes, then we know it has already
                # been checked.
                if reference not in self._nodes:
                    self._check_key(reference)
                    absent_references.append(reference)
            node_refs.append(tuple(reference_list))
        return tuple(node_refs), absent_references

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \\0 or \\n.
        :raises BadIndexDuplicateKey: if key was already added (a key that
            is only known as an absent reference may still be added).
        """
        (node_refs,
         absent_references) = self._check_key_ref_value(key, references, value)
        if key in self._nodes and self._nodes[key][0] != 'a':
            raise errors.BadIndexDuplicateKey(key, self)
        for reference in absent_references:
            # There may be duplicates, but I don't think it is worth worrying
            # about
            self._nodes[reference] = ('a', (), '')
        self._nodes[key] = ('', node_refs, value)
        self._keys.add(key)
        # Keep the nested view in step for every key length:
        # _get_nodes_by_key builds it for one-element keys too, so skipping
        # them here would leave a stale cache.  _update_nodes_by_key is a
        # no-op while the view has not been built.
        self._update_nodes_by_key(key, value, node_refs)

    def finish(self):
        """Serialise the index.

        :return: A StringIO holding the signature, the three option lines,
            one line per node (sorted by key) and a terminating newline.
        :raises BzrError: if reference lists are in use and the serialised
            length differs from the length predicted by the pre-pass.
        """
        lines = [_SIGNATURE]
        lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
        lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
        lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')
        prefix_length = sum(len(x) for x in lines)
        # references are byte offsets. To avoid having to do nasty
        # polynomial work to resolve offsets (references to later in the
        # file cannot be determined until all the inbetween references have
        # been calculated too) we pad the offsets with 0's to make them be
        # of consistent length. Using binary offsets would break the trivial
        # file parsing.
        # to calculate the width of zero's needed we do three passes:
        # one to gather all the non-reference data and the number of references.
        # one to pad all the data with reference-length and determine entry
        # addresses.
        # One to serialise.

        # forward sorted by key. In future we may consider topological sorting,
        # at the cost of table scans for direct lookup, or a second index for
        # direct lookup
        nodes = sorted(self._nodes.items())
        # if we do not prepass, we don't know how long it will be up front.
        expected_bytes = None
        # we only need to pre-pass if we have reference lists at all.
        if self.reference_lists:
            key_offset_info = []
            non_ref_bytes = prefix_length
            total_references = 0
            # TODO use simple multiplication for the constants in this loop.
            for key, (absent, references, value) in nodes:
                # record the offset known *so far* for this key:
                # the non reference bytes to date, and the total references to
                # date - saves reaccumulating on the second pass
                key_offset_info.append((key, non_ref_bytes, total_references))
                # key is literal, value is literal, there are 3 null's, 1 NL
                # key is variable length tuple, \x00 between elements
                non_ref_bytes += sum(len(element) for element in key)
                if self._key_length > 1:
                    non_ref_bytes += self._key_length - 1
                # value is literal bytes, there are 3 null's, 1 NL.
                non_ref_bytes += len(value) + 3 + 1
                # one byte for absent if set.
                if absent:
                    non_ref_bytes += 1
                elif self.reference_lists:
                    # (ref_lists -1) tabs
                    non_ref_bytes += self.reference_lists - 1
                    # (ref-1 cr's per ref_list)
                    for ref_list in references:
                        # how many references across the whole file?
                        total_references += len(ref_list)
                        # accrue reference separators
                        if ref_list:
                            non_ref_bytes += len(ref_list) - 1
            # how many digits are needed to represent the total byte count?
            digits = 1
            possible_total_bytes = non_ref_bytes + total_references*digits
            while 10 ** digits < possible_total_bytes:
                digits += 1
                possible_total_bytes = non_ref_bytes + total_references*digits
            expected_bytes = possible_total_bytes + 1 # terminating newline
            # resolve key addresses.
            key_addresses = {}
            for key, non_ref_bytes, total_references in key_offset_info:
                key_addresses[key] = non_ref_bytes + total_references*digits
            # serialise
            format_string = '%%0%sd' % digits
        for key, (absent, references, value) in nodes:
            flattened_references = []
            for ref_list in references:
                ref_addresses = []
                for reference in ref_list:
                    ref_addresses.append(format_string % key_addresses[reference])
                flattened_references.append('\r'.join(ref_addresses))
            string_key = '\x00'.join(key)
            lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,
                '\t'.join(flattened_references), value))
        lines.append('\n')
        result = StringIO(''.join(lines))
        if expected_bytes and len(result.getvalue()) != expected_bytes:
            raise errors.BzrError('Failed index creation. Internal error:'
                ' mismatched output length and expected length: %d %d' %
                (len(result.getvalue()), expected_bytes))
        return result

    def set_optimize(self, for_size=None, combine_backing_indices=None):
        """Change how the builder tries to optimize the result.

        :param for_size: Tell the builder to try and make the index as small as
            possible.
        :param combine_backing_indices: If the builder spills to disk to save
            memory, should the on-disk indices be combined. Set to True if you
            are going to be probing the index, but to False if you are not. (If
            you are not querying, then the time spent combining is wasted.)
        :return: None
        """
        # GraphIndexBuilder itself doesn't pay attention to the flag yet, but
        # other builders do.
        if for_size is not None:
            self._optimize_for_size = for_size
        if combine_backing_indices is not None:
            self._combine_backing_indices = combine_backing_indices

336

337

338

class GraphIndex(object):

339

"""An index for data with embedded graphs.

340

341

The index maps keys to a list of key reference lists, and a value.

342

Each node has the same number of key reference lists. Each key reference

343

list can be empty or an arbitrary length. The value is an opaque NULL

344

terminated string without any newlines. The storage of the index is

345

hidden in the interface: keys and key references are always tuples of

346

bytestrings, never the internal representation (e.g. dictionary offsets).

347

348

It is presumed that the index will not be mutated - it is static data.

349

350

Successive iter_all_entries calls will read the entire index each time.

351

Additionally, iter_entries calls will read the index linearly until the

352

desired keys are found. XXX: This must be fixed before the index is

353

suitable for production use. :XXX

354

"""

355

356

def __init__(self, transport, name, size):

357

"""Open an index called name on transport.

358

359

:param transport: A bzrlib.transport.Transport.

360

:param name: A path to provide to transport API calls.

361

:param size: The size of the index in bytes. This is used for bisection

362

logic to perform partial index reads. While the size could be

363

obtained by statting the file this introduced an additional round

364

trip as well as requiring stat'able transports, both of which are

365

avoided by having it supplied. If size is None, then bisection

366

support will be disabled and accessing the index will just stream

367

all the data.

368

"""

369

self._transport = transport

370

self._name = name

371

# Becomes a dict of key:(value, reference-list-byte-locations) used by

372

# the bisection interface to store parsed but not resolved keys.

373

self._bisect_nodes = None

374

# Becomes a dict of key:(value, reference-list-keys) which are ready to

375

# be returned directly to callers.

376

self._nodes = None

377

# a sorted list of slice-addresses for the parsed bytes of the file.

378

# e.g. (0,1) would mean that byte 0 is parsed.

379

self._parsed_byte_map = []

380

# a sorted list of keys matching each slice address for parsed bytes

381

# e.g. (None, 'foo@bar') would mean that the first byte contained no

382

# key, and the end byte of the slice is the of the data for 'foo@bar'

383

self._parsed_key_map = []

384

self._key_count = None

385

self._keys_by_offset = None

386

self._nodes_by_key = None

387

self._size = size

388

# The number of bytes we've read so far in trying to process this file

389

self._bytes_read = 0

390

391

def __eq__(self, other):

392

"""Equal when self and other were created with the same parameters."""

393

return (

394

type(self) == type(other) and

395

self._transport == other._transport and

396

self._name == other._name and

397

self._size == other._size)

398

399

def __ne__(self, other):

400

return not self.__eq__(other)

401

402

def __repr__(self):

403

return "%s(%r)" % (self.__class__.__name__,

404

self._transport.abspath(self._name))

405

406

def _buffer_all(self, stream=None):
    """Buffer all the index data.

    Mutates self._nodes, self._keys and self._keys_by_offset.

    :param stream: An optional file-like object positioned at the start of
        the index. When None the index is fetched with
        self._transport.get(self._name).
    :raises BadIndexData: if the parsed data does not end with exactly one
        trailer line.
    """
    if self._nodes is not None:
        # We already did this
        return
    if 'index' in debug.debug_flags:
        mutter('Reading entire index %s', self._transport.abspath(self._name))
    if stream is None:
        # NOTE(review): the stream opened here is never closed explicitly;
        # confirm whether the transport's file objects need closing.
        stream = self._transport.get(self._name)
    self._read_prefix(stream)
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # ready-to-return key:value or key:value, node_ref_lists
    self._nodes = {}
    self._nodes_by_key = None
    # Everything after the header is parsed in one go; pos is the byte
    # offset at which that remainder starts.
    pos = stream.tell()
    lines = stream.read().split('\n')
    # split() leaves one element after the final newline; drop it.
    del lines[-1]
    _, _, _, trailers = self._parse_lines(lines, pos)
    for key, absent, references, value in self._keys_by_offset.itervalues():
        if absent:
            continue
        # resolve references:
        if self.node_ref_lists:
            node_value = (value, self._resolve_references(references))
        else:
            node_value = value
        self._nodes[key] = node_value
    # cache the keys for quick set intersections
    self._keys = set(self._nodes)
    if trailers != 1:
        # there must be one line - the empty trailer line.
        raise errors.BadIndexData(self)

445

446

def external_references(self, ref_list_num):
    """Return references that are not present in this index.

    Buffers the whole index first.

    :param ref_list_num: Which reference list of each node to inspect.
    :return: The set of keys referenced from that list which are not keys
        of this index.
    :raises ValueError: if the index has no reference list with that
        number.
    """
    self._buffer_all()
    available = self.node_ref_lists
    if ref_list_num + 1 > available:
        raise ValueError('No ref list %d, index has %d ref lists'
            % (ref_list_num, available))
    referenced = set()
    for value, ref_lists in self._nodes.itervalues():
        referenced.update(ref_lists[ref_list_num])
    return referenced - self._keys

458

459

def _get_nodes_by_key(self):

460

if self._nodes_by_key is None:

461

nodes_by_key = {}

462

if self.node_ref_lists:

463

for key, (value, references) in self._nodes.iteritems():

464

key_dict = nodes_by_key

465

for subkey in key[:-1]:

466

key_dict = key_dict.setdefault(subkey, {})

467

key_dict[key[-1]] = key, value, references

468

else:

469

for key, value in self._nodes.iteritems():

470

key_dict = nodes_by_key

471

for subkey in key[:-1]:

472

key_dict = key_dict.setdefault(subkey, {})

473

key_dict[key[-1]] = key, value

474

self._nodes_by_key = nodes_by_key

475

return self._nodes_by_key

476

477

def iter_all_entries(self):
    """Iterate over all keys within the index.

    :return: An iterable of (index, key, value) or (index, key, value,
        reference_lists).
        The former tuple is used when there are no reference lists in the
        index, making the API compatible with simple key:value index types.
        There is no defined order for the result iteration - it will be in
        the most efficient order for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    if not self.node_ref_lists:
        # Plain key:value index - nodes map straight to their value.
        for key, value in self._nodes.iteritems():
            yield self, key, value
    else:
        for key, (value, node_ref_lists) in self._nodes.iteritems():
            yield self, key, value, node_ref_lists

497

498

def _read_prefix(self, stream):

499

signature = stream.read(len(self._signature()))

500

if not signature == self._signature():

501

raise errors.BadIndexFormatSignature(self._name, GraphIndex)

502

options_line = stream.readline()

503

if not options_line.startswith(_OPTION_NODE_REFS):

504

raise errors.BadIndexOptions(self)

505

try:

506

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):-1])

507

except ValueError:

508

raise errors.BadIndexOptions(self)

509

options_line = stream.readline()

510

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

511

raise errors.BadIndexOptions(self)

512

try:

513

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):-1])

514

except ValueError:

515

raise errors.BadIndexOptions(self)

516

options_line = stream.readline()

517

if not options_line.startswith(_OPTION_LEN):

518

raise errors.BadIndexOptions(self)

519

try:

520

self._key_count = int(options_line[len(_OPTION_LEN):-1])

521

except ValueError:

522

raise errors.BadIndexOptions(self)

523

524

def _resolve_references(self, references):

525

"""Return the resolved key references for references.

526

527

References are resolved by looking up the location of the key in the

528

_keys_by_offset map and substituting the key name, preserving ordering.

529

530

:param references: An iterable of iterables of key locations. e.g.

531

[[123, 456], [123]]

532

:return: A tuple of tuples of keys.

533

"""

534

node_refs = []

535

for ref_list in references:

536

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

537

return tuple(node_refs)

538

539

def _find_index(self, range_map, key):

540

"""Helper for the _parsed_*_index calls.

541

542

Given a range map - [(start, end), ...], finds the index of the range

543

in the map for key if it is in the map, and if it is not there, the

544

immediately preceeding range in the map.

545

"""

546

result = bisect_right(range_map, key) - 1

547

if result + 1 < len(range_map):

548

# check the border condition, it may be in result + 1

549

if range_map[result + 1][0] == key[0]:

550

return result + 1

551

return result

552

553

def _parsed_byte_index(self, offset):

554

"""Return the index of the entry immediately before offset.

555

556

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

557

there is one unparsed byte (the 11th, addressed as[10]). then:

558

asking for 0 will return 0

559

asking for 10 will return 0

560

asking for 11 will return 1

561

asking for 12 will return 1

562

"""

563

key = (offset, 0)

564

return self._find_index(self._parsed_byte_map, key)

565

566

def _parsed_key_index(self, key):

567

"""Return the index of the entry immediately before key.

568

569

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

570

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

571

have been parsed, then:

572

asking for '' will return 0

573

asking for 'a' will return 0

574

asking for 'b' will return 1

575

asking for 'e' will return 1

576

"""

577

search_key = (key, None)

578

return self._find_index(self._parsed_key_map, search_key)

579

580

def _is_parsed(self, offset):

581

"""Returns True if offset has been parsed."""

582

index = self._parsed_byte_index(offset)

583

if index == len(self._parsed_byte_map):

584

return offset < self._parsed_byte_map[index - 1][1]

585

start, end = self._parsed_byte_map[index]

586

return offset >= start and offset < end

587

588

def _iter_entries_from_total_buffer(self, keys):

589

"""Iterate over keys when the entire index is parsed."""

590

keys = keys.intersection(self._keys)

591

if self.node_ref_lists:

592

for key in keys:

593

value, node_refs = self._nodes[key]

594

yield self, key, value, node_refs

595

else:

596

for key in keys:

597

yield self, key, self._nodes[key]

598

599

def iter_entries(self, keys):
    """Iterate over keys within the index.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys supplied. No additional keys will be returned, and every
        key supplied that is in the index will be returned.
    """
    wanted = set(keys)
    if not wanted:
        return []
    not_buffered = self._nodes is None
    if not_buffered and self._size is None:
        # Without a size bisection is impossible, so read everything.
        self._buffer_all()

    # We fit about 20 keys per minimum-read (4K), so if we are looking for
    # more than 1/20th of the index its likely (assuming homogenous key
    # spread) that we'll read the entire index. If we're going to do that,
    # buffer the whole thing. A better analysis might take key spread into
    # account - but B+Tree indices are better anyway.
    # We could look at all data read, and use a threshold there, which will
    # trigger on ancestry walks, but that is not yet fully mapped out.
    if self._nodes is None and len(wanted) * 20 > self.key_count():
        self._buffer_all()
    if self._nodes is None:
        # Still not buffered: answer by bisecting the file.
        return (result[1] for result in bisect_multi_bytes(
            self._lookup_keys_via_location, self._size, wanted))
    return self._iter_entries_from_total_buffer(wanted)

627

628

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not to within
    the bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    WARNING: Note that this method currently causes a full index parse
    unconditionally (which is reasonably appropriate as it is a means for
    thunking many small indices into one larger one and still supplies
    iter_all_entries at the thunk layer).

    NOTE(review): for indices with one-element keys a requested key that
    is not in the index raises KeyError from the self._nodes lookup,
    whereas the multi-element path silently skips unknown prefixes.

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned.
    :raises BadIndexKey: if a prefix starts with None or has the wrong
        length.
    """
    prefixes = set(keys)
    if not prefixes:
        return
    # load data - also finds key lengths
    if self._nodes is None:
        self._buffer_all()

    def sanity_check(prefix):
        # The first element must be concrete and the tuple full length.
        if prefix[0] is None:
            raise errors.BadIndexKey(prefix)
        if len(prefix) != self._key_length:
            raise errors.BadIndexKey(prefix)

    if self._key_length == 1:
        # With one-element keys a prefix is simply a whole key.
        for key in prefixes:
            sanity_check(key)
            if self.node_ref_lists:
                value, node_refs = self._nodes[key]
                yield self, key, value, node_refs
            else:
                yield self, key, self._nodes[key]
        return
    nodes_by_key = self._get_nodes_by_key()
    for key in prefixes:
        sanity_check(key)
        # find what it refers to: descend one dict level per leading
        # non-None element.
        subtree = nodes_by_key
        depth = 0
        try:
            while depth < len(key) and key[depth] is not None:
                subtree = subtree[key[depth]]
                depth += 1
        except KeyError:
            # a non-existant lookup.
            continue
        if depth == len(key):
            # the last thing looked up was a terminal element
            yield (self, ) + subtree
            continue
        # Some trailing elements were None: walk everything below subtree.
        pending = [subtree]
        while pending:
            current = pending.pop(-1)
            # can't be empty or would not exist
            item, sample = current.iteritems().next()
            if type(sample) == dict:
                # push keys
                pending.extend(current.itervalues())
            else:
                # yield keys
                for entry in current.itervalues():
                    # each value is the key:value:node refs tuple
                    # ready to yield.
                    yield (self, ) + entry

705

706

def key_count(self):
    """Return an estimate of the number of keys in this index.

    For GraphIndex the estimate is exact.
    """
    if self._key_count is not None:
        return self._key_count
    # Not known yet: read and parse the header range.
    self._read_and_parse([_HEADER_READV])
    return self._key_count

714

715

def _lookup_keys_via_location(self, location_keys):
    """Public interface for implementing bisection.

    iter_entries hands this method to bisect_multi_bytes as its lookup
    callback.

    If _buffer_all has been called, then all the data for the index is in
    memory, and this method should not be called, as it uses a separate
    cache because it cannot pre-resolve all indices, which buffer_all does
    for performance.

    :param location_keys: A list of location(byte offset), key tuples.
    :return: A list of (location_key, result) tuples as expected by
        bzrlib.bisect_multi.bisect_multi_bytes.
    """
    # Possible improvements:
    #  - only bisect lookup each key once
    #  - sort the keys first, and use that to reduce the bisection window
    # -----
    # this progresses in three parts:
    # read data
    # parse it
    # attempt to answer the question from the now in memory data.

    def read_length(location):
        # for each location, ask for 800 bytes - much more than rows we've
        # seen anywhere - but never past the end of the file.
        length = 800
        if location + length > self._size:
            length = self._size - location
        return length

    # build the readv request
    readv_ranges = []
    for location, key in location_keys:
        # can we answer from cache?
        if self._bisect_nodes and key in self._bisect_nodes:
            # We have the key parsed.
            continue
        index = self._parsed_key_index(key)
        if len(self._parsed_key_map):
            first_key, last_key = self._parsed_key_map[index]
            if (first_key <= key and
                (last_key >= key or
                 # end of the file has been parsed
                 self._parsed_byte_map[index][1] == self._size)):
                # the key has been parsed, so no lookup is needed even if
                # its not present.
                continue
        # - if we have examined this part of the file already - yes
        index = self._parsed_byte_index(location)
        if len(self._parsed_byte_map):
            start, end = self._parsed_byte_map[index]
            if start <= location and end > location:
                # the byte region has been parsed, so no read is needed.
                continue
        length = read_length(location)
        # todo, trim out parsed locations.
        if length > 0:
            readv_ranges.append((location, length))
    # read the header if needed
    if self._bisect_nodes is None:
        readv_ranges.append(_HEADER_READV)
    self._read_and_parse(readv_ranges)
    result = []
    if self._nodes is not None:
        # _read_and_parse triggered a _buffer_all because we requested the
        # whole data range
        for location, key in location_keys:
            location_key = (location, key)
            if key not in self._nodes: # not present
                result.append((location_key, False))
            elif self.node_ref_lists:
                value, refs = self._nodes[key]
                result.append((location_key, (self, key, value, refs)))
            else:
                result.append((location_key, (self, key, self._nodes[key])))
        return result
    # generate results:
    #  - figure out <, >, missing, present
    #  - result present references so we can return them.
    # keys that we cannot answer until we resolve references
    pending_references = []
    pending_locations = set()
    for location, key in location_keys:
        location_key = (location, key)
        # can we answer from cache?
        if key in self._bisect_nodes:
            # the key has been parsed, so no lookup is needed
            if not self.node_ref_lists:
                result.append((location_key,
                    (self, key, self._bisect_nodes[key])))
                continue
            # the references may not have been all parsed.
            value, refs = self._bisect_nodes[key]
            wanted_locations = [ref for ref_list in refs for ref in ref_list
                                if ref not in self._keys_by_offset]
            if wanted_locations:
                pending_locations.update(wanted_locations)
                pending_references.append(location_key)
                continue
            result.append((location_key, (self, key,
                value, self._resolve_references(refs))))
            continue
        # has the region the key should be in, been parsed?
        index = self._parsed_key_index(key)
        if (self._parsed_key_map[index][0] <= key and
            (self._parsed_key_map[index][1] >= key or
             # end of the file has been parsed
             self._parsed_byte_map[index][1] == self._size)):
            result.append((location_key, False))
            continue
        # no, is the key above or below the probed location:
        # get the range of the probed & parsed location
        index = self._parsed_byte_index(location)
        # if the key is below the start of the range, its below
        if key < self._parsed_key_map[index][0]:
            direction = -1
        else:
            direction = +1
        result.append((location_key, direction))
    readv_ranges = []
    # lookup data to resolve references
    for location in pending_locations:
        length = read_length(location)
        # TODO: trim out parsed locations (e.g. if the 800 is into the
        # parsed region trim it, and dont use the adjust_for_latency
        # facility)
        if length > 0:
            readv_ranges.append((location, length))
    self._read_and_parse(readv_ranges)
    if self._nodes is not None:
        # The _read_and_parse triggered a _buffer_all, grab the data and
        # return it
        for location, key in pending_references:
            value, refs = self._nodes[key]
            result.append(((location, key), (self, key, value, refs)))
        return result
    for location, key in pending_references:
        # answer key references we had to look-up-late.
        value, refs = self._bisect_nodes[key]
        result.append(((location, key), (self, key,
            value, self._resolve_references(refs))))
    return result

856

857

def _parse_header_from_bytes(self, bytes):
    """Parse the header from a region of bytes.

    The header is the file signature followed by three option lines: the
    number of node reference lists, the number of key elements and the
    number of keys. On success the header bytes are recorded as parsed
    and the bisection parsing state is reset.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data (which may have length 0).
    :raises BadIndexFormatSignature: If bytes does not start with the
        signature of this index type.
    :raises BadIndexOptions: If an option line is missing, does not start
        with the expected option name, or has a non-integer value.
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if not signature == expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(expected_signature):].splitlines()
    if len(lines) < 3:
        # a truncated header would otherwise escape as an IndexError from
        # the lines[n] lookups below; report it as bad options instead.
        raise errors.BadIndexOptions(self)

    def parse_option(options_line, option_prefix):
        # return the integer that follows option_prefix on options_line.
        if not options_line.startswith(option_prefix):
            raise errors.BadIndexOptions(self)
        try:
            return int(options_line[len(option_prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = parse_option(lines[0], _OPTION_NODE_REFS)
    self._key_length = parse_option(lines[1], _OPTION_KEY_ELEMENTS)
    self._key_count = parse_option(lines[2], _OPTION_LEN)
    # calculate the bytes we have processed; the + 3 accounts for the
    # line terminator after each of the three option lines.
    header_end = (len(signature) + len(lines[0]) + len(lines[1]) +
                  len(lines[2]) + 3)
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

900

901

def _parse_region(self, offset, data):
    """Parse node data returned from a readv operation.

    The data is handed to _parse_segment one segment at a time until
    either the data ends inside the parsed range that was looked up for
    the current position, or _parse_segment reports that it handled the
    last possible segment.

    :param offset: The byte offset the data starts at.
    :param data: The data to parse.
    """
    region_end = offset + len(data)
    resume_from = offset
    finished = False
    while not finished:
        map_index = self._parsed_byte_index(resume_from)
        # Trivial test - when the data ends before the end of the parsed
        # range found for the current position there is nothing to do.
        if region_end < self._parsed_byte_map[map_index][1]:
            break
        resume_from, finished = self._parse_segment(
            offset, data, region_end, map_index)

923

924

def _parse_segment(self, offset, data, end, index):
    """Parse one segment of data.

    Bytes that overlap the parsed ranges on either side of the segment
    are skipped. Where an edge of the data does not line up with a parsed
    range (or the end of the file) the partial line at that edge is
    discarded, so that only complete lines are handed to _parse_lines.

    :param offset: Where 'data' begins in the file.
    :param data: Some data to parse a segment of.
    :param end: Where data ends
    :param index: The current index into the parsed bytes map.
    :return: high_parsed_byte, last_segment.
        high_parsed_byte is the location of the highest parsed byte in this
        segment, last_segment is True if the parsed segment is the last
        possible one in the data block.
    :raises AssertionError: If an edge needed trimming but the data has no
        newline, or if nothing is left to parse after trimming.
    """
    # accommodate overlap with data before this.
    lower_end = self._parsed_byte_map[index][1]
    if offset < lower_end:
        # overlaps the lower parsed region: skip the parsed data and
        # don't trim the start for \n
        trim_start = lower_end - offset
        start_adjacent = True
    elif offset == lower_end:
        # abuts the lower parsed region: use all data, trim nothing
        trim_start = None
        start_adjacent = True
    else:
        # does not overlap the lower parsed region: use all data but trim
        # the leading \n
        trim_start = None
        start_adjacent = False
    # default is to use all data
    trim_end = None
    if end == self._size:
        # lines up to the end of all data: do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif index + 1 == len(self._parsed_byte_map):
        # at the end of the parsed data: strip to the last \n
        end_adjacent = False
        last_segment = True
    else:
        next_start, next_end = self._parsed_byte_map[index + 1]
        if end == next_start:
            # butts up against the next parsed region
            end_adjacent = True
            last_segment = True
        elif end > next_start:
            # overlaps into the next parsed region: only consider the
            # unparsed data, and do not strip to the last \n as we know
            # its an entire record
            trim_end = next_start - offset
            end_adjacent = True
            last_segment = end < next_end
        else:
            # does not overlap into the next region: strip to the last \n
            end_adjacent = False
            last_segment = True
    # now find bytes to discard if needed. A non-adjacent edge always has
    # its trim value still set to None at this point, so a plain
    # find/rfind over the whole of data is sufficient.
    if not start_adjacent:
        trim_start = data.find('\n') + 1
        if not (trim_start != 0):
            raise AssertionError('no \n was present')
    if not end_adjacent:
        trim_end = data.rfind('\n') + 1
        if not (trim_end != 0):
            raise AssertionError('no \n was present')
    # adjust offset and data to the parseable data.
    trimmed_data = data[trim_start:trim_end]
    if not (trimmed_data):
        # the trim values are formatted with %s because either of them
        # may still be None here, which %d cannot format.
        raise AssertionError('read unneeded data [%s:%s] from [%d:%d]'
            % (trim_start, trim_end, offset, offset + len(data)))
    if trim_start:
        offset += trim_start
    # splitlines mangles the \r delimiters.. don't use it.
    lines = trimmed_data.split('\n')
    # drop the final element produced by the split
    del lines[-1]
    first_key, last_key, nodes, _ = self._parse_lines(lines, offset)
    for key, value in nodes:
        self._bisect_nodes[key] = value
    high_parsed = offset + len(trimmed_data)
    self._parsed_bytes(offset, first_key, high_parsed, last_key)
    return high_parsed, last_segment

1031

1032

def _parse_lines(self, lines, pos):

1033

key = None

1034

first_key = None

1035

trailers = 0

1036

nodes = []

1037

for line in lines:

1038

if line == '':

1039

# must be at the end

1040

if self._size:

1041

if not (self._size == pos + 1):

1042

raise AssertionError("%s %s" % (self._size, pos))

1043

trailers += 1

1044

continue

1045

elements = line.split('\0')

1046

if len(elements) != self._expected_elements:

1047

raise errors.BadIndexData(self)

1048

# keys are tuples. Each element is a string that may occur many

1049

# times, so we intern them to save space. AB, RC, 200807

1050

key = tuple([intern(element) for element in elements[:self._key_length]])

1051

if first_key is None:

1052

first_key = key

1053

absent, references, value = elements[-3:]

1054

ref_lists = []

1055

for ref_string in references.split('\t'):

1056

ref_lists.append(tuple([

1057

int(ref) for ref in ref_string.split('\r') if ref

1058

]))

1059

ref_lists = tuple(ref_lists)

1060

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

1061

pos += len(line) + 1 # +1 for the \n

1062

if absent:

1063

continue

1064

if self.node_ref_lists:

1065

node_value = (value, ref_lists)

1066

else:

1067

node_value = value

1068

nodes.append((key, node_value))

1069

# print "parsed ", key

1070

return first_key, key, nodes, trailers

1071

1072

def _parsed_bytes(self, start, start_key, end, end_key):
    """Mark the bytes from start to end as parsed.

    Calling self._parsed_bytes(1, None, 2, None) will mark one byte (the
    one at offset 1) as parsed.

    The range is merged into self._parsed_byte_map, and its keys into
    self._parsed_key_map, by joining it to an existing range that ends
    at start and/or one that begins at end; otherwise a new entry is
    inserted.

    :param start: The start of the parsed region.
    :param start_key: The key to record for the start of the region.
    :param end: The end of the parsed region.
    :param end_key: The key to record for the end of the region.
    """
    index = self._parsed_byte_index(start)
    new_value = (start, end)
    new_key = (start_key, end_key)
    if index == -1:
        # start is before every known range (normally because nothing has
        # been parsed yet), so the new range belongs at the front. Note
        # that list.insert(-1, ...) would place it before the last
        # element of a non-empty list rather than at the front.
        self._parsed_byte_map.insert(0, new_value)
        self._parsed_key_map.insert(0, new_key)
        return
    # four cases:
    # new region
    # extend lower region
    # extend higher region
    # combine two regions
    joins_lower = self._parsed_byte_map[index][1] == start
    joins_higher = (index + 1 < len(self._parsed_byte_map) and
                    self._parsed_byte_map[index + 1][0] == end)
    if joins_lower and joins_higher:
        # combine two regions
        self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],
            self._parsed_byte_map[index + 1][1])
        self._parsed_key_map[index] = (self._parsed_key_map[index][0],
            self._parsed_key_map[index + 1][1])
        del self._parsed_byte_map[index + 1]
        del self._parsed_key_map[index + 1]
    elif joins_lower:
        # extend the lower entry
        self._parsed_byte_map[index] = (
            self._parsed_byte_map[index][0], end)
        self._parsed_key_map[index] = (
            self._parsed_key_map[index][0], end_key)
    elif joins_higher:
        # extend the higher entry
        self._parsed_byte_map[index + 1] = (
            start, self._parsed_byte_map[index + 1][1])
        self._parsed_key_map[index + 1] = (
            start_key, self._parsed_key_map[index + 1][1])
    else:
        # new entry
        self._parsed_byte_map.insert(index + 1, new_value)
        self._parsed_key_map.insert(index + 1, new_key)

1121

1122

def _read_and_parse(self, readv_ranges):
    """Read the requested ranges and parse the resulting data.

    Nothing is done for an empty range list. When the index has not been
    fully buffered and at least half of it has already been read, or when
    a single returned chunk turns out to be the whole file, the index is
    buffered completely via _buffer_all instead of being parsed
    piecemeal.

    :param readv_ranges: A prepared readv range list.
    """
    if not readv_ranges:
        return
    if self._nodes is None:
        if self._bytes_read * 2 >= self._size:
            # We've already read more than 50% of the file and we are
            # about to request more data, just _buffer_all() and be done
            self._buffer_all()
            return

    chunks = self._transport.readv(self._name, readv_ranges, True,
        self._size)
    # parse
    for start, chunk in chunks:
        chunk_length = len(chunk)
        self._bytes_read += chunk_length
        if start == 0 and chunk_length == self._size:
            # We read the whole range, most likely because the
            # Transport upcast our readv ranges into one long request
            # for enough total data to grab the whole index.
            self._buffer_all(StringIO(chunk))
            return
        if self._bisect_nodes is None:
            # no header has been parsed yet, so this must be the start
            if start != 0:
                raise AssertionError()
            start, chunk = self._parse_header_from_bytes(chunk)
        self._parse_region(start, chunk)

1153

1154

def _signature(self):
    """Return the signature that files of this index type start with."""
    signature = _SIGNATURE
    return signature

1157

1158

def validate(self):
    """Validate that everything in the index can be accessed."""
    # walking every entry is a complete validation at the moment, so the
    # entries themselves are simply discarded.
    entries = self.iter_all_entries()
    for unused_node in entries:
        pass

1163

1164

1165

class CombinedGraphIndex(object):

1166

"""A GraphIndex made up from smaller GraphIndices.

1167

1168

The backing indices must implement GraphIndex, and are presumed to be

1169

static data.

1170

1171

Queries against the combined index will be made against the first index,

1172

and then the second and so on. The order of index's can thus influence

1173

performance significantly. For example, if one index is on local disk and a

1174

second on a remote server, the local disk index should be before the other

1175

in the index list.

1176

"""

1177

1178

def __init__(self, indices, reload_func=None):

1179

"""Create a CombinedGraphIndex backed by indices.

1180

1181

:param indices: An ordered list of indices to query for data.

1182

:param reload_func: A function to call if we find we are missing an

1183

index. Should have the form reload_func() => True/False to indicate

1184

if reloading actually changed anything.

1185

"""

1186

self._indices = indices

1187

self._reload_func = reload_func

1188

1189

def __repr__(self):

1190

return "%s(%s)" % (

1191

self.__class__.__name__,

1192

', '.join(map(repr, self._indices)))

1193

1194

@symbol_versioning.deprecated_method(symbol_versioning.one_one)

1195

def get_parents(self, revision_ids):

1196

"""See graph._StackedParentsProvider.get_parents.

1197

1198

This implementation thunks the graph.Graph.get_parents api across to

1199

GraphIndex.

1200

1201

:param revision_ids: An iterable of graph keys for this graph.

1202

:return: A list of parent details for each key in revision_ids.

1203

Each parent details will be one of:

1204

* None when the key was missing

1205

* (NULL_REVISION,) when the key has no parents.

1206

* (parent_key, parent_key...) otherwise.

1207

"""

1208

parent_map = self.get_parent_map(revision_ids)

1209

return [parent_map.get(r, None) for r in revision_ids]

1210

1211

def get_parent_map(self, keys):

1212

"""See graph._StackedParentsProvider.get_parent_map"""

1213

search_keys = set(keys)

1214

if NULL_REVISION in search_keys:

1215

search_keys.discard(NULL_REVISION)

1216

found_parents = {NULL_REVISION:[]}

1217

else:

1218

found_parents = {}

1219

for index, key, value, refs in self.iter_entries(search_keys):

1220

parents = refs[0]

1221

if not parents:

1222

parents = (NULL_REVISION,)

1223

found_parents[key] = parents

1224

return found_parents

1225

1226

has_key = _has_key_from_parent_map

1227

1228

def insert_index(self, pos, index):

1229

"""Insert a new index in the list of indices to query.

1230

1231

:param pos: The position to insert the index.

1232

:param index: The index to insert.

1233

"""

1234

self._indices.insert(pos, index)

1235

1236

def iter_all_entries(self):

1237

"""Iterate over all keys within the index

1238

1239

Duplicate keys across child indices are presumed to have the same

1240

value and are only reported once.

1241

1242

:return: An iterable of (index, key, reference_lists, value).

1243

There is no defined order for the result iteration - it will be in

1244

the most efficient order for the index.

1245

"""

1246

seen_keys = set()

1247

while True:

1248

try:

1249

for index in self._indices:

1250

for node in index.iter_all_entries():

1251

if node[1] not in seen_keys:

1252

yield node

1253

seen_keys.add(node[1])

1254

return

1255

except errors.NoSuchFile:

1256

self._reload_or_raise()

1257

1258

def iter_entries(self, keys):

1259

"""Iterate over keys within the index.

1260

1261

Duplicate keys across child indices are presumed to have the same

1262

value and are only reported once.

1263

1264

:param keys: An iterable providing the keys to be retrieved.

1265

:return: An iterable of (index, key, reference_lists, value). There is no

1266

defined order for the result iteration - it will be in the most

1267

efficient order for the index.

1268

"""

1269

keys = set(keys)

1270

while True:

1271

try:

1272

for index in self._indices:

1273

if not keys:

1274

return

1275

for node in index.iter_entries(keys):

1276

keys.remove(node[1])

1277

yield node

1278

return

1279

except errors.NoSuchFile:

1280

self._reload_or_raise()

1281

1282

def iter_entries_prefix(self, keys):

1283

"""Iterate over keys within the index using prefix matching.

1284

1285

Duplicate keys across child indices are presumed to have the same

1286

value and are only reported once.

1287

1288

Prefix matching is applied within the tuple of a key, not to within

1289

the bytestring of each key element. e.g. if you have the keys ('foo',

1290

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1291

only the former key is returned.

1292

1293

:param keys: An iterable providing the key prefixes to be retrieved.

1294

Each key prefix takes the form of a tuple the length of a key, but

1295

with the last N elements 'None' rather than a regular bytestring.

1296

The first element cannot be 'None'.

1297

:return: An iterable as per iter_all_entries, but restricted to the

1298

keys with a matching prefix to those supplied. No additional keys

1299

will be returned, and every match that is in the index will be

1300

returned.

1301

"""

1302

keys = set(keys)

1303

if not keys:

1304

return

1305

seen_keys = set()

1306

while True:

1307

try:

1308

for index in self._indices:

1309

for node in index.iter_entries_prefix(keys):

1310

if node[1] in seen_keys:

1311

continue

1312

seen_keys.add(node[1])

1313

yield node

1314

return

1315

except errors.NoSuchFile:

1316

self._reload_or_raise()

1317

1318

def key_count(self):

1319

"""Return an estimate of the number of keys in this index.

1320

1321

For CombinedGraphIndex this is approximated by the sum of the keys of

1322

the child indices. As child indices may have duplicate keys this can

1323

have a maximum error of the number of child indices * largest number of

1324

keys in any index.

1325

"""

1326

while True:

1327

try:

1328

return sum((index.key_count() for index in self._indices), 0)

1329

except errors.NoSuchFile:

1330

self._reload_or_raise()

1331

1332

missing_keys = _missing_keys_from_parent_map

1333

1334

def _reload_or_raise(self):

1335

"""We just got a NoSuchFile exception.

1336

1337

Try to reload the indices, if it fails, just raise the current

1338

exception.

1339

"""

1340

if self._reload_func is None:

1341

raise

1342

exc_type, exc_value, exc_traceback = sys.exc_info()

1343

trace.mutter('Trying to reload after getting exception: %s',

1344

exc_value)

1345

if not self._reload_func():

1346

# We tried to reload, but nothing changed, so we fail anyway

1347

trace.mutter('_reload_func indicated nothing has changed.'

1348

' Raising original exception.')

1349

raise exc_type, exc_value, exc_traceback

1350

1351

def validate(self):

1352

"""Validate that everything in the index can be accessed."""

1353

while True:

1354

try:

1355

for index in self._indices:

1356

index.validate()

1357

return

1358

except errors.NoSuchFile:

1359

self._reload_or_raise()

1360

1361

1362

class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during a
    single write operation, where the accumulated entries need to be immediately
    available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add
            when this index has reference lists, or of (key, value) entries
            when it does not.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when this index has no reference lists.
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (in this case
            dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        if self.reference_lists:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value, references
        else:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when this index has no reference lists.
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (keys iteration order
            in this case).
        """
        keys = set(keys)
        if self.reference_lists:
            for key in keys.intersection(self._keys):
                # each stored node is (absent, references, value)
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2], node[1]
        else:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        :raises BadIndexKey: If a prefix starts with None or does not have
            the key length of this index.
        """
        # XXX: To much duplication with the GraphIndex class; consider finding
        # a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        if self._key_length == 1:
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                try:
                    node = self._nodes[key]
                except KeyError:
                    # a non-existent lookup matches nothing, as in the
                    # multi-element case below.
                    continue
                if node[0]:
                    # absent node
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
            return
        nodes_by_key = self._get_nodes_by_key()
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = nodes_by_key
            elements = list(key)
            # find the subdict to return
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                # some trailing elements were None: walk everything below
                # the dict that was reached.
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    value = key_dict.itervalues().next()
                    if type(value) == dict:
                        # push keys
                        dicts.extend(key_dict.itervalues())
                    else:
                        # yield keys
                        for value in key_dict.itervalues():
                            yield (self, ) + value
            else:
                # the whole key was given, so key_dict is the node itself
                yield (self, ) + key_dict

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory index's have no known corruption at the moment."""

1501

1502

1503

class GraphIndexPrefixAdapter(object):
    """An adapter between GraphIndex with different key lengths.

    Queries against this will emit queries against the adapted Graph with the
    prefix added, queries for all items use iter_entries_prefix. The returned
    nodes will have their keys and node references adjusted to remove the
    prefix. Finally, an add_nodes_callback can be supplied - when called the
    nodes and references being added will have prefix prepended.
    """

    def __init__(self, adapted, prefix, missing_key_length,
        add_nodes_callback=None):
        """Construct an adapter against adapted with prefix."""
        self.adapted = adapted
        self.add_nodes_callback = add_nodes_callback
        self.prefix = prefix
        self.prefix_len = len(prefix)
        # the prefix padded with None, used to query for every key that
        # starts with the prefix
        padding = (None,) * missing_key_length
        self.prefix_key = prefix + padding

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add,
            or of (key, value) entries when there are no references.
        """
        prefix = self.prefix
        # save nodes in case its an iterator
        pending = tuple(nodes)
        translated = []
        try:
            # node_refs is a tuple of tuples of keys; the prefix goes onto
            # every one of those keys as well as onto the node's own key.
            for key, value, node_refs in pending:
                prefixed_refs = tuple([
                    tuple([prefix + ref_node for ref_node in ref_list])
                    for ref_list in node_refs])
                translated.append((prefix + key, value, prefixed_refs))
        except ValueError:
            # XXX: TODO add an explicit interface for getting the reference list
            # status, to handle this bit of user-friendliness in the API more
            # explicitly.
            for key, value in pending:
                translated.append((prefix + key, value))
        self.add_nodes_callback(translated)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \0 or \n.
        """
        single_node = (key, value, references)
        self.add_nodes((single_node, ))

    def _strip_prefix(self, an_iter):
        """Strip prefix data from nodes and return it."""
        for node in an_iter:
            prefix, cut = self.prefix, self.prefix_len
            # cross checks: the key and every reference must carry the
            # prefix
            full_key = node[1]
            if full_key[:cut] != prefix:
                raise errors.BadIndexData(self)
            ref_lists = node[3]
            for ref_list in ref_lists:
                for ref_node in ref_list:
                    if ref_node[:cut] != prefix:
                        raise errors.BadIndexData(self)
            stripped_refs = tuple([
                tuple([ref_node[cut:] for ref_node in ref_list])
                for ref_list in ref_lists])
            yield node[0], full_key[cut:], node[2], stripped_refs

    def iter_all_entries(self):
        """Iterate over all keys within the index

        iter_all_entries is implemented against the adapted index using
        iter_entries_prefix.

        :return: An iterable of (index, key, value, reference_lists) with
            the prefix removed from the key and from the references. There
            is no defined order for the result iteration.
        """
        matching = self.adapted.iter_entries_prefix([self.prefix_key])
        return self._strip_prefix(matching)

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists). There is no
            defined order for the result iteration - it will be in the most
            efficient order for the index (keys iteration order in this case).
        """
        prefixed_keys = (self.prefix + key for key in keys)
        return self._strip_prefix(self.adapted.iter_entries(prefixed_keys))

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        prefixed_keys = (self.prefix + key for key in keys)
        return self._strip_prefix(
            self.adapted.iter_entries_prefix(prefixed_keys))

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For GraphIndexPrefixAdapter this is relatively expensive - key
        iteration with the prefix is done.
        """
        count = 0
        for unused_node in self.iter_all_entries():
            count += 1
        return count

    def validate(self):
        """Call the adapted's validate."""
        self.adapted.validate()

Older »