/brz/remove-bazaar : revision 3948.3.8

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Martin Pool
Date: 2009-03-23 07:25:27 UTC
mfrom: (4183 +trunk)
mto: This revision was merged to the branch mainline in revision 4189.
Revision ID: mbp@sourcefrog.net-20090323072527-317my4n8zej1g6v9

merge trunk

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_btree_serializer_c.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_create_clone.py

bzrlib/tests/branch_implementations/test_dotted_revno_to_revision_id.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_iter_merge_sorted_revisions.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_dotted_revno.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_content_filters.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_views.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/index.txt

doc/news-template.txt

generate_docs.py

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/build_release.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

# Public names of this module: the names bound by
# ``from bzrlib.index import *``.
__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

symbol_versioning,

)

# (offset, length) readv range requested when only the index header is needed.
_HEADER_READV = (0, 200)
# Prefixes of the three option lines that GraphIndexBuilder.finish() writes
# after the signature and that the GraphIndex header parsers expect.
_OPTION_KEY_ELEMENTS = "key_elements="
_OPTION_LEN = "len="
_OPTION_NODE_REFS = "node_ref_lists="
# Signature line written first by GraphIndexBuilder.finish().
_SIGNATURE = "Bazaar Graph Index 1\n"

# Matches any character that GraphIndexBuilder._check_key rejects inside a
# key element.
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')
# Matches the characters that GraphIndexBuilder._check_key_ref_value rejects
# inside a node value.
_newline_null_re = re.compile('[\n\0]')

def _has_key_from_parent_map(self, key):

"""Check if this index has one key.

If it's possible to check for multiple keys at once through

calling get_parent_map that should be faster.

"""

return (key in self.get_parent_map([key]))

def _missing_keys_from_parent_map(self, keys):

return set(keys) - set(self.get_parent_map(keys))

class GraphIndexBuilder(object):
    """Collect nodes in memory and serialise them as a GraphIndex.

    finish() emits the following layout:

    _SIGNATURE OPTIONS NODES NEWLINE
    _SIGNATURE     := 'Bazaar Graph Index 1' NEWLINE
    OPTIONS        := 'node_ref_lists=' DIGITS NEWLINE
                      'key_elements=' DIGITS NEWLINE
                      'len=' DIGITS NEWLINE
    NODES          := NODE*
    NODE           := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE
    KEY            := KEY_ELEMENT (NULL KEY_ELEMENT){key_elements - 1}
    KEY_ELEMENT    := Not-whitespace-utf8
    ABSENT         := 'a'
    REFERENCES     := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}
    REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?
    REFERENCE      := DIGITS  ; zero-padded byte offset in the index of the
                              ; referenced key.
    VALUE          := no-newline-no-null-bytes
    """

    def __init__(self, reference_lists=0, key_elements=1):
        """Create a GraphIndex builder.

        :param reference_lists: The number of node references lists for each
            entry.
        :param key_elements: The number of bytestrings in each key.
        """
        self.reference_lists = reference_lists
        self._key_length = key_elements
        # Keys added through add_node (absent placeholders are not included).
        self._keys = set()
        # {key: (absent, ref_lists, value)}; absent is 'a' for placeholder
        # entries created for not-yet-added references, '' otherwise.
        self._nodes = {}
        # Nested-dict view of _nodes, built lazily by _get_nodes_by_key.
        self._nodes_by_key = None
        self._optimize_for_size = False

    def _check_key(self, key):
        """Raise BadIndexKey if key is not a valid key for this index."""
        if type(key) != tuple or self._key_length != len(key):
            raise errors.BadIndexKey(key)
        for part in key:
            if part and _whitespace_re.search(part) is None:
                continue
            # empty, or contains a forbidden character
            raise errors.BadIndexKey(part)

    def _external_references(self):
        """Return references that are not present in this index.

        Only the second reference list of each node is examined, so an
        empty set is returned when there are fewer than two lists.
        """
        # TODO: JAM 2008-11-21 This makes an assumption about how the reference
        #       lists are used. It is currently correct for pack-0.92 through
        #       1.9, which use the node references (3rd column) second
        #       reference list as the compression parent. Perhaps this should
        #       be moved into something higher up the stack, since it
        #       makes assumptions about how the index is used.
        if self.reference_lists <= 1:
            # If reference_lists == 0 there can be no external references, and
            # if reference_lists == 1, then there isn't a place to store the
            # compression parent
            return set()
        present = set()
        referenced = set()
        for node in self.iter_all_entries():
            present.add(node[1])
            referenced.update(node[3][1])
        return referenced - present

    def _get_nodes_by_key(self):
        """Return (building it on first use) the nested-dict view of nodes.

        A key (foo, bar, baz) is reachable as result[foo][bar][baz]; the
        leaf is (key, value, references) when the index has reference
        lists and (key, value) otherwise. Absent nodes are left out.
        """
        if self._nodes_by_key is not None:
            return self._nodes_by_key
        tree = {}
        with_refs = self.reference_lists
        for key, (absent, references, value) in self._nodes.iteritems():
            if absent:
                continue
            bucket = tree
            for subkey in key[:-1]:
                bucket = bucket.setdefault(subkey, {})
            if with_refs:
                bucket[key[-1]] = key, value, references
            else:
                bucket[key[-1]] = key, value
        self._nodes_by_key = tree
        return tree

    def _update_nodes_by_key(self, key, value, node_refs):
        """Record a new key in the _nodes_by_key dict, if it has been built.

        For a key of (foo, bar, baz) this stores
        _nodes_by_key[foo][bar][baz] = key_value
        """
        bucket = self._nodes_by_key
        if bucket is None:
            # The nested view has not been requested yet; nothing to update.
            return
        if self.reference_lists:
            leaf = key, value, node_refs
        else:
            leaf = key, value
        for subkey in key[:-1]:
            bucket = bucket.setdefault(subkey, {})
        bucket[key[-1]] = leaf

    def _check_key_ref_value(self, key, references, value):
        """Check that 'key', 'references' and 'value' are all valid.

        :param key: A key tuple. Must conform to the key interface (be a tuple,
            be of the right length, not have any whitespace or nulls in any key
            element.)
        :param references: A sized iterable of reference lists. Something like
            [[(ref, key)], [(ref, key), (other, key)]]
        :param value: The value associated with this key. Must not contain
            newlines or null characters.
        :return: (node_refs, absent_references)
            node_refs   a packed form of 'references' where all iterables
                        are tuples
            absent_references   reference keys that are not in self._nodes.
                                This may contain duplicates if the same key is
                                referenced in multiple lists.
        """
        self._check_key(key)
        if _newline_null_re.search(value) is not None:
            raise errors.BadIndexValue(value)
        if len(references) != self.reference_lists:
            raise errors.BadIndexValue(references)
        packed = []
        missing = []
        for ref_list in references:
            for ref in ref_list:
                if ref in self._nodes:
                    # Already validated when it was stored.
                    continue
                self._check_key(ref)
                missing.append(ref)
            packed.append(tuple(ref_list))
        return tuple(packed), missing

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \\0 or \\n.
        """
        node_refs, absent_references = self._check_key_ref_value(
            key, references, value)
        existing = self._nodes.get(key)
        if existing is not None and existing[0] != 'a':
            # Only an absent placeholder may be replaced by a real node.
            raise errors.BadIndexDuplicateKey(key, self)
        # Duplicates in absent_references are harmless: each one just
        # rewrites the same placeholder.
        for reference in absent_references:
            self._nodes[reference] = ('a', (), '')
        self._nodes[key] = ('', node_refs, value)
        self._keys.add(key)
        if self._nodes_by_key is not None and self._key_length > 1:
            self._update_nodes_by_key(key, value, node_refs)

    def finish(self):
        """Serialise every node and return the result in a StringIO.

        References are written as byte offsets, zero-padded to a common
        width so that every node address can be computed before any node
        is written. When reference lists are in use this takes three
        passes: measure the non-reference bytes and count references, pick
        the digit width and resolve each key's address, then serialise.

        :raises errors.BzrError: if the serialised length differs from the
            length predicted by the measuring pass.
        """
        lines = [
            _SIGNATURE,
            _OPTION_NODE_REFS + str(self.reference_lists) + '\n',
            _OPTION_KEY_ELEMENTS + str(self._key_length) + '\n',
            _OPTION_LEN + str(len(self._keys)) + '\n',
            ]
        header_size = sum(len(piece) for piece in lines)
        # forward sorted by key. In future we may consider topological sorting,
        # at the cost of table scans for direct lookup, or a second index for
        # direct lookup
        ordered_nodes = sorted(self._nodes.items())
        # Without the measuring pass the final length is not known up front.
        expected_bytes = None
        if self.reference_lists:
            # (key, non-reference bytes before it, references before it)
            offsets_so_far = []
            fixed_bytes = header_size
            ref_count = 0
            # \x00 separators between the elements of one key
            key_separators = 0
            if self._key_length > 1:
                key_separators = self._key_length - 1
            # tabs between the reference lists of one node
            tab_count = self.reference_lists - 1
            for key, (absent, references, value) in ordered_nodes:
                offsets_so_far.append((key, fixed_bytes, ref_count))
                fixed_bytes += sum(len(element) for element in key)
                fixed_bytes += key_separators
                # value is literal bytes, there are 3 null's, 1 NL.
                fixed_bytes += len(value) + 3 + 1
                if absent:
                    # one byte for the absent marker; no references follow
                    fixed_bytes += 1
                    continue
                fixed_bytes += tab_count
                for ref_list in references:
                    ref_count += len(ref_list)
                    if ref_list:
                        # CR separators inside one reference list
                        fixed_bytes += len(ref_list) - 1
            # how many digits are needed to represent the total byte count?
            digits = 1
            total_bytes = fixed_bytes + ref_count * digits
            while 10 ** digits < total_bytes:
                digits += 1
                total_bytes = fixed_bytes + ref_count * digits
            expected_bytes = total_bytes + 1 # terminating newline
            # resolve key addresses.
            key_addresses = {}
            for key, fixed_before, refs_before in offsets_so_far:
                key_addresses[key] = fixed_before + refs_before * digits
            address_format = '%%0%sd' % digits
        # serialise
        for key, (absent, references, value) in ordered_nodes:
            packed_lists = []
            for ref_list in references:
                packed_lists.append('\r'.join(
                    [address_format % key_addresses[reference]
                     for reference in ref_list]))
            lines.append("%s\x00%s\x00%s\x00%s\n" % (
                '\x00'.join(key), absent, '\t'.join(packed_lists), value))
        lines.append('\n')
        result = StringIO(''.join(lines))
        if expected_bytes and len(result.getvalue()) != expected_bytes:
            raise errors.BzrError('Failed index creation. Internal error:'
                ' mismatched output length and expected length: %d %d' %
                (len(result.getvalue()), expected_bytes))
        return result

    def set_optimize(self, for_size=True):
        """Change how the builder tries to optimize the result.

        :param for_size: Tell the builder to try and make the index as small as
            possible.
        :return: None
        """
        # GraphIndexBuilder itself only records the flag; nothing in this
        # class reads it.
        self._optimize_for_size = for_size

328

329

330

class GraphIndex(object):

331

"""An index for data with embedded graphs.

332

333

The index maps keys to a list of key reference lists, and a value.

334

Each node has the same number of key reference lists. Each key reference

335

list can be empty or an arbitrary length. The value is an opaque NULL

336

terminated string without any newlines. The storage of the index is

337

hidden in the interface: keys and key references are always tuples of

338

bytestrings, never the internal representation (e.g. dictionary offsets).

339

340

It is presumed that the index will not be mutated - it is static data.

341

342

Successive iter_all_entries calls will read the entire index each time.

343

Additionally, iter_entries calls will read the index linearly until the

344

desired keys are found. XXX: This must be fixed before the index is

345

suitable for production use. :XXX

346

"""

347

348

def __init__(self, transport, name, size):

349

"""Open an index called name on transport.

350

351

:param transport: A bzrlib.transport.Transport.

352

:param name: A path to provide to transport API calls.

353

:param size: The size of the index in bytes. This is used for bisection

354

logic to perform partial index reads. While the size could be

355

obtained by statting the file this introduced an additional round

356

trip as well as requiring stat'able transports, both of which are

357

avoided by having it supplied. If size is None, then bisection

358

support will be disabled and accessing the index will just stream

359

all the data.

360

"""

361

self._transport = transport

362

self._name = name

363

# Becomes a dict of key:(value, reference-list-byte-locations) used by

364

# the bisection interface to store parsed but not resolved keys.

365

self._bisect_nodes = None

366

# Becomes a dict of key:(value, reference-list-keys) which are ready to

367

# be returned directly to callers.

368

self._nodes = None

369

# a sorted list of slice-addresses for the parsed bytes of the file.

370

# e.g. (0,1) would mean that byte 0 is parsed.

371

self._parsed_byte_map = []

372

# a sorted list of keys matching each slice address for parsed bytes

373

# e.g. (None, 'foo@bar') would mean that the first byte contained no

374

# key, and the end byte of the slice is the of the data for 'foo@bar'

375

self._parsed_key_map = []

376

self._key_count = None

377

self._keys_by_offset = None

378

self._nodes_by_key = None

379

self._size = size

380

# The number of bytes we've read so far in trying to process this file

381

self._bytes_read = 0

382

383

def __eq__(self, other):

384

"""Equal when self and other were created with the same parameters."""

385

return (

386

type(self) == type(other) and

387

self._transport == other._transport and

388

self._name == other._name and

389

self._size == other._size)

390

391

def __ne__(self, other):

392

return not self.__eq__(other)

393

394

def __repr__(self):

395

return "%s(%r)" % (self.__class__.__name__,

396

self._transport.abspath(self._name))

397

398

def _buffer_all(self, stream=None):
    """Read and parse the whole index into memory.

    Populates self._nodes, self._keys and self._keys_by_offset and resets
    self._nodes_by_key. Does nothing when self._nodes is already set.

    :param stream: An optional file-like object to read the index from.
        When None, the index is fetched with
        self._transport.get(self._name).
    :raises errors.BadIndexData: if the parsed data did not contain
        exactly one empty trailer line.
    """
    if self._nodes is not None:
        # We already did this
        return
    if 'index' in debug.debug_flags:
        mutter('Reading entire index %s', self._transport.abspath(self._name))
    if stream is None:
        stream = self._transport.get(self._name)
    self._read_prefix(stream)
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # ready-to-return key:value or key:value, node_ref_lists
    self._nodes = {}
    self._nodes_by_key = None
    # Offset of the first node line, needed to key _keys_by_offset.
    pos = stream.tell()
    lines = stream.read().split('\n')
    # Drop whatever follows the final newline (normally an empty string).
    del lines[-1]
    _, _, _, trailers = self._parse_lines(lines, pos)
    for key, absent, references, value in self._keys_by_offset.itervalues():
        if absent:
            continue
        # resolve references:
        if self.node_ref_lists:
            node_value = (value, self._resolve_references(references))
        else:
            node_value = value
        self._nodes[key] = node_value
    # cache the keys for quick set intersections
    self._keys = set(self._nodes)
    if trailers != 1:
        # there must be one line - the empty trailer line.
        raise errors.BadIndexData(self)

437

438

def external_references(self, ref_list_num):
    """Return references that are not present in this index.

    :param ref_list_num: Which reference list of each node to examine
        (0-based).
    :return: The set of keys referenced in that list by some node but not
        themselves keys of this index.
    :raises ValueError: if the index has no such reference list.
    """
    self._buffer_all()
    if ref_list_num >= self.node_ref_lists:
        raise ValueError('No ref list %d, index has %d ref lists'
            % (ref_list_num, self.node_ref_lists))
    referenced = set()
    for value, ref_lists in self._nodes.itervalues():
        referenced.update(ref_lists[ref_list_num])
    return referenced - self._keys

450

451

def _get_nodes_by_key(self):

452

if self._nodes_by_key is None:

453

nodes_by_key = {}

454

if self.node_ref_lists:

455

for key, (value, references) in self._nodes.iteritems():

456

key_dict = nodes_by_key

457

for subkey in key[:-1]:

458

key_dict = key_dict.setdefault(subkey, {})

459

key_dict[key[-1]] = key, value, references

460

else:

461

for key, value in self._nodes.iteritems():

462

key_dict = nodes_by_key

463

for subkey in key[:-1]:

464

key_dict = key_dict.setdefault(subkey, {})

465

key_dict[key[-1]] = key, value

466

self._nodes_by_key = nodes_by_key

467

return self._nodes_by_key

468

469

def iter_all_entries(self):
    """Iterate over all keys within the index.

    The whole index is buffered first if that has not happened yet.

    :return: An iterable of (index, key, value) or (index, key, value,
        reference_lists). The former tuple is used when there are no
        reference lists in the index, making the API compatible with
        simple key:value index types. There is no defined order for the
        result iteration - it will be in the most efficient order for the
        index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    has_ref_lists = self.node_ref_lists
    for key, node in self._nodes.iteritems():
        if has_ref_lists:
            value, node_ref_lists = node
            yield self, key, value, node_ref_lists
        else:
            yield self, key, node

489

490

def _read_prefix(self, stream):
    """Consume and validate the signature and three option lines.

    Sets self.node_ref_lists, self._key_length and self._key_count from
    the option lines, leaving ``stream`` positioned after them.

    :param stream: A file-like object positioned at the start of the
        index.
    :raises errors.BadIndexFormatSignature: if the signature differs from
        self._signature().
    :raises errors.BadIndexOptions: if an option line has the wrong prefix
        or a non-integer value.
    """
    expected_signature = self._signature()
    if stream.read(len(expected_signature)) != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)

    def read_int_option(prefix):
        # Read one 'prefix<int>\n' line and return the integer.
        line = stream.readline()
        if not line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            # [:-1] drops the line terminator
            return int(line[len(prefix):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = read_int_option(_OPTION_NODE_REFS)
    self._key_length = read_int_option(_OPTION_KEY_ELEMENTS)
    self._key_count = read_int_option(_OPTION_LEN)

515

516

def _resolve_references(self, references):

517

"""Return the resolved key references for references.

518

519

References are resolved by looking up the location of the key in the

520

_keys_by_offset map and substituting the key name, preserving ordering.

521

522

:param references: An iterable of iterables of key locations. e.g.

523

[[123, 456], [123]]

524

:return: A tuple of tuples of keys.

525

"""

526

node_refs = []

527

for ref_list in references:

528

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

529

return tuple(node_refs)

530

531

def _find_index(self, range_map, key):

532

"""Helper for the _parsed_*_index calls.

533

534

Given a range map - [(start, end), ...], finds the index of the range

535

in the map for key if it is in the map, and if it is not there, the

536

immediately preceeding range in the map.

537

"""

538

result = bisect_right(range_map, key) - 1

539

if result + 1 < len(range_map):

540

# check the border condition, it may be in result + 1

541

if range_map[result + 1][0] == key[0]:

542

return result + 1

543

return result

544

545

def _parsed_byte_index(self, offset):

546

"""Return the index of the entry immediately before offset.

547

548

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

549

there is one unparsed byte (the 11th, addressed as[10]). then:

550

asking for 0 will return 0

551

asking for 10 will return 0

552

asking for 11 will return 1

553

asking for 12 will return 1

554

"""

555

key = (offset, 0)

556

return self._find_index(self._parsed_byte_map, key)

557

558

def _parsed_key_index(self, key):

559

"""Return the index of the entry immediately before key.

560

561

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

562

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

563

have been parsed, then:

564

asking for '' will return 0

565

asking for 'a' will return 0

566

asking for 'b' will return 1

567

asking for 'e' will return 1

568

"""

569

search_key = (key, None)

570

return self._find_index(self._parsed_key_map, search_key)

571

572

def _is_parsed(self, offset):

573

"""Returns True if offset has been parsed."""

574

index = self._parsed_byte_index(offset)

575

if index == len(self._parsed_byte_map):

576

return offset < self._parsed_byte_map[index - 1][1]

577

start, end = self._parsed_byte_map[index]

578

return offset >= start and offset < end

579

580

def _iter_entries_from_total_buffer(self, keys):

581

"""Iterate over keys when the entire index is parsed."""

582

keys = keys.intersection(self._keys)

583

if self.node_ref_lists:

584

for key in keys:

585

value, node_refs = self._nodes[key]

586

yield self, key, value, node_refs

587

else:

588

for key in keys:

589

yield self, key, self._nodes[key]

590

591

def iter_entries(self, keys):
    """Iterate over keys within the index.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys supplied. No additional keys will be returned, and every
        key supplied that is in the index will be returned.
    """
    wanted = set(keys)
    if not wanted:
        return []
    # With no size supplied bisection is impossible, so read everything.
    if self._nodes is None and self._size is None:
        self._buffer_all()

    # We fit about 20 keys per minimum-read (4K), so if we are looking for
    # more than 1/20th of the index its likely (assuming homogenous key
    # spread) that we'll read the entire index. If we're going to do that,
    # buffer the whole thing. A better analysis might take key spread into
    # account - but B+Tree indices are better anyway.
    # We could look at all data read, and use a threshold there, which will
    # trigger on ancestry walks, but that is not yet fully mapped out.
    if self._nodes is None and len(wanted) * 20 > self.key_count():
        self._buffer_all()
    if self._nodes is None:
        # Still unbuffered: answer by bisecting the file on disk.
        return (found[1] for found in bisect_multi_bytes(
            self._lookup_keys_via_location, self._size, wanted))
    return self._iter_entries_from_total_buffer(wanted)

619

620

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not to within
    the bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    WARNING: Note that this method currently causes a full index parse
    unconditionally (which is reasonably appropriate as it is a means for
    thunking many small indices into one larger one and still supplies
    iter_all_entries at the thunk layer).

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned. A prefix that matches nothing contributes nothing.
    :raises errors.BadIndexKey: if a prefix starts with None or is not of
        the index's key length.
    """
    keys = set(keys)
    if not keys:
        return
    # load data - also finds key lengths
    if self._nodes is None:
        self._buffer_all()
    if self._key_length == 1:
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            try:
                node = self._nodes[key]
            except KeyError:
                # a non-existent lookup: skip it, exactly as the
                # multi-element branch below does.
                continue
            if self.node_ref_lists:
                value, node_refs = node
                yield self, key, value, node_refs
            else:
                yield self, key, node
        return
    nodes_by_key = self._get_nodes_by_key()
    for key in keys:
        # sanity check
        if key[0] is None:
            raise errors.BadIndexKey(key)
        if len(key) != self._key_length:
            raise errors.BadIndexKey(key)
        # find what it refers to:
        key_dict = nodes_by_key
        elements = list(key)
        # find the subdict whose contents should be returned.
        try:
            while len(elements) and elements[0] is not None:
                key_dict = key_dict[elements[0]]
                elements.pop(0)
        except KeyError:
            # a non-existent lookup.
            continue
        if len(elements):
            # Some trailing elements were None: walk every subtree below
            # the point reached and yield all leaves.
            dicts = [key_dict]
            while dicts:
                key_dict = dicts.pop(-1)
                # can't be empty or would not exist
                item, value = key_dict.iteritems().next()
                if type(value) == dict:
                    # push keys
                    dicts.extend(key_dict.itervalues())
                else:
                    # yield keys
                    for value in key_dict.itervalues():
                        # each value is the key:value:node refs tuple
                        # ready to yield.
                        yield (self, ) + value
        else:
            # the last thing looked up was a terminal element
            yield (self, ) + key_dict

697

698

def key_count(self):
    """Return an estimate of the number of keys in this index.

    For GraphIndex the estimate is exact. The header is read on demand if
    the count is not known yet.
    """
    if self._key_count is not None:
        return self._key_count
    self._read_and_parse([_HEADER_READV])
    return self._key_count

706

707

def _lookup_keys_via_location(self, location_keys):
    """Public interface for implementing bisection.

    If _buffer_all has been called, then all the data for the index is in
    memory, and this method should not be called, as it uses a separate
    cache because it cannot pre-resolve all indices, which buffer_all does
    for performance.

    Each answer is one of: False (the key is known not to be present), -1
    or +1 (the key sorts before / not before the first key parsed around
    the probed location), or the entry tuple (self, key, value[, refs]).

    :param location_keys: A list of location(byte offset), key tuples.
    :return: A list of (location_key, result) tuples as expected by
        bzrlib.bisect_multi.bisect_multi_bytes.
    """
    # Possible improvements:
    #  - only bisect lookup each key once
    #  - sort the keys first, and use that to reduce the bisection window
    # -----
    # this progresses in three parts:
    # read data
    # parse it
    # attempt to answer the question from the now in memory data.
    # build the readv request
    # for each location, ask for 800 bytes - much more than rows we've seen
    # anywhere.
    readv_ranges = []
    for location, key in location_keys:
        # can we answer from cache?
        if self._bisect_nodes and key in self._bisect_nodes:
            # We have the key parsed.
            continue
        index = self._parsed_key_index(key)
        if (len(self._parsed_key_map) and
            self._parsed_key_map[index][0] <= key and
            (self._parsed_key_map[index][1] >= key or
             # end of the file has been parsed
             self._parsed_byte_map[index][1] == self._size)):
            # the key has been parsed, so no lookup is needed even if its
            # not present.
            continue
        # - if we have examined this part of the file already - yes
        index = self._parsed_byte_index(location)
        if (len(self._parsed_byte_map) and
            self._parsed_byte_map[index][0] <= location and
            self._parsed_byte_map[index][1] > location):
            # the byte region has been parsed, so no read is needed.
            continue
        length = 800
        # clamp the request so it does not run past the end of the file
        if location + length > self._size:
            length = self._size - location
        # todo, trim out parsed locations.
        if length > 0:
            readv_ranges.append((location, length))
    # read the header if needed
    if self._bisect_nodes is None:
        readv_ranges.append(_HEADER_READV)
    self._read_and_parse(readv_ranges)
    result = []
    if self._nodes is not None:
        # _read_and_parse triggered a _buffer_all because we requested the
        # whole data range
        for location, key in location_keys:
            if key not in self._nodes: # not present
                result.append(((location, key), False))
            elif self.node_ref_lists:
                value, refs = self._nodes[key]
                result.append(((location, key),
                    (self, key, value, refs)))
            else:
                result.append(((location, key),
                    (self, key, self._nodes[key])))
        return result
    # generate results:
    #  - figure out <, >, missing, present
    #  - result present references so we can return them.
    # keys that we cannot answer until we resolve references
    pending_references = []
    # byte offsets of referenced nodes that have not been parsed yet
    pending_locations = set()
    for location, key in location_keys:
        # can we answer from cache?
        if key in self._bisect_nodes:
            # the key has been parsed, so no lookup is needed
            if self.node_ref_lists:
                # the references may not have been all parsed.
                value, refs = self._bisect_nodes[key]
                wanted_locations = []
                for ref_list in refs:
                    for ref in ref_list:
                        if ref not in self._keys_by_offset:
                            wanted_locations.append(ref)
                if wanted_locations:
                    # defer this key until the second read below
                    pending_locations.update(wanted_locations)
                    pending_references.append((location, key))
                    continue
                result.append(((location, key), (self, key,
                    value, self._resolve_references(refs))))
            else:
                result.append(((location, key),
                    (self, key, self._bisect_nodes[key])))
            continue
        else:
            # has the region the key should be in, been parsed?
            index = self._parsed_key_index(key)
            if (self._parsed_key_map[index][0] <= key and
                (self._parsed_key_map[index][1] >= key or
                 # end of the file has been parsed
                 self._parsed_byte_map[index][1] == self._size)):
                result.append(((location, key), False))
                continue
        # no, is the key above or below the probed location:
        # get the range of the probed & parsed location
        index = self._parsed_byte_index(location)
        # if the key is below the start of the range, its below
        if key < self._parsed_key_map[index][0]:
            direction = -1
        else:
            direction = +1
        result.append(((location, key), direction))
    readv_ranges = []
    # lookup data to resolve references
    for location in pending_locations:
        length = 800
        if location + length > self._size:
            length = self._size - location
        # TODO: trim out parsed locations (e.g. if the 800 is into the
        # parsed region trim it, and dont use the adjust_for_latency
        # facility)
        if length > 0:
            readv_ranges.append((location, length))
    self._read_and_parse(readv_ranges)
    if self._nodes is not None:
        # The _read_and_parse triggered a _buffer_all, grab the data and
        # return it
        # (pending_references is only filled when node_ref_lists is set,
        # so each buffered node unpacks as a (value, refs) pair)
        for location, key in pending_references:
            value, refs = self._nodes[key]
            result.append(((location, key), (self, key, value, refs)))
        return result
    for location, key in pending_references:
        # answer key references we had to look-up-late.
        value, refs = self._bisect_nodes[key]
        result.append(((location, key), (self, key,
            value, self._resolve_references(refs))))
    return result

848

849

def _parse_header_from_bytes(self, bytes):
    """Parse the index header found at the start of a region of bytes.

    The header is the file signature followed by three option lines, in
    this order: node reference list count, key element count, key count.
    The parsed values are stored on self as node_ref_lists, _key_length
    and _key_count, the header bytes are recorded as parsed, and the
    bisection parsing state is initialised.

    :param bytes: The data to parse; it must begin at offset 0 of the file.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data (which may have length 0).
    :raises BadIndexFormatSignature: if the data does not start with the
        signature of this index type.
    :raises BadIndexOptions: if an option line has the wrong prefix or a
        non-integer value.
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if signature != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(expected_signature):].splitlines()
    # (option prefix, attribute that receives the parsed integer), in the
    # order the option lines appear in the header.
    option_table = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    for line_number, (option_prefix, attribute) in enumerate(option_table):
        options_line = lines[line_number]
        if not options_line.startswith(option_prefix):
            raise errors.BadIndexOptions(self)
        try:
            parsed_value = int(options_line[len(option_prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed_value)
    # calculate the bytes we have processed: the signature plus the three
    # option lines, each of which lost one line terminator to splitlines().
    header_end = len(signature) + 3
    for options_line in lines[:3]:
        header_end += len(options_line)
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    # each record holds the key elements plus absent, references and value
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

892

893

def _parse_region(self, offset, data):
    """Parse node data returned from a readv operation.

    The data is handed to _parse_segment one segment at a time until
    either the end of the data lies inside an already-parsed range or
    _parse_segment reports that it handled the last possible segment.

    :param offset: The byte offset the data starts at.
    :param data: The data to parse.
    """
    end = offset + len(data)
    high_parsed = offset
    last_segment = False
    while not last_segment:
        # Trivial test - if the end of the data is within the
        # low-matching parsed range, we're done.
        index = self._parsed_byte_index(high_parsed)
        if end < self._parsed_byte_map[index][1]:
            return
        high_parsed, last_segment = self._parse_segment(
            offset, data, end, index)

915

916

def _parse_segment(self, offset, data, end, index):
    """Parse one segment of data.

    The data is trimmed so that only bytes not yet covered by the parsed
    byte map are parsed, and so that parsing starts and stops on record
    (newline) boundaries unless the data directly adjoins an
    already-parsed range or the end of the file.

    :param offset: Where 'data' begins in the file.
    :param data: Some data to parse a segment of.
    :param end: Where data ends
    :param index: The current index into the parsed bytes map.
    :return: high_parsed_byte, last_segment.
        high_parsed_byte is the location of the highest parsed byte in this
        segment, last_segment is True if the parsed segment is the last
        possible one in the data block.
    :raises AssertionError: if a newline that is needed to find a record
        boundary is missing, or if nothing is left to parse after trimming.
    """
    lower_end = self._parsed_byte_map[index][1]
    # accomodate overlap with data before this.
    if offset < lower_end:
        # overlaps the lower parsed region: skip the parsed data.
        trim_start = lower_end - offset
    else:
        # abuts, or lies beyond, the lower parsed region: use all data.
        trim_start = None
    # Only data that does not touch the lower parsed region needs its
    # partial leading record (up to the first \n) discarded.
    start_adjacent = offset <= lower_end

    # default is to use all data, and to treat this as the last segment
    trim_end = None
    last_segment = True
    if end == self._size:
        # lines up to the end of all data: do not strip to the last \n
        end_adjacent = True
    elif index + 1 == len(self._parsed_byte_map):
        # at the end of the parsed data: strip to the last \n
        end_adjacent = False
    else:
        next_start, next_end = self._parsed_byte_map[index + 1]
        if end == next_start:
            # buts up against the next parsed region
            end_adjacent = True
        elif end > next_start:
            # overlaps into the next parsed region: only consider the
            # unparsed data, which is known to end on an entire record.
            trim_end = next_start - offset
            end_adjacent = True
            last_segment = end < next_end
        else:
            # does not overlap into the next region: strip to the last \n
            end_adjacent = False

    # now find bytes to discard if needed
    if not start_adjacent:
        # trim_start is always None on this path, so search from the start
        trim_start = data.find('\n') + 1
        if trim_start == 0:
            raise AssertionError('no \n was present')
    if not end_adjacent:
        # trim_end is always None on this path, so search the whole data
        trim_end = data.rfind('\n') + 1
        if trim_end == 0:
            raise AssertionError('no \n was present')
    # adjust offset and data to the parseable data.
    trimmed_data = data[trim_start:trim_end]
    if not trimmed_data:
        # trim_start and trim_end may still be None here, so they must be
        # formatted with %s; %d would raise TypeError and hide this error.
        raise AssertionError('read unneeded data [%s:%s] from [%d:%d]'
            % (trim_start, trim_end, offset, offset + len(data)))
    if trim_start:
        offset += trim_start
    # splitlines mangles the \r delimiters.. don't use it.
    lines = trimmed_data.split('\n')
    # drop the fragment that follows the final \n
    del lines[-1]
    first_key, last_key, nodes, _ = self._parse_lines(lines, offset)
    for key, value in nodes:
        self._bisect_nodes[key] = value
    segment_end = offset + len(trimmed_data)
    self._parsed_bytes(offset, first_key, segment_end, last_key)
    return segment_end, last_segment

1023

1024

def _parse_lines(self, lines, pos):
    """Parse complete index records, one per line.

    Each non-empty line is split on NUL into the key elements followed by
    the absent marker, the references field and the value. Every parsed
    record is stored in self._keys_by_offset under the offset it starts
    at; records whose absent marker is empty are also collected as nodes.

    :param lines: The record lines, without their trailing newlines.
    :param pos: The file offset at which the first line starts.
    :return: first_key, last_key, nodes, trailers. first_key and last_key
        are the first and last keys parsed (None if no record was parsed),
        nodes is a list of (key, node_value) pairs and trailers counts the
        empty lines seen.
    :raises BadIndexData: if a line has the wrong number of elements.
    :raises AssertionError: if an empty line is seen anywhere other than
        at the final byte of the file.
    """
    first_key = None
    key = None
    trailers = 0
    nodes = []
    for line in lines:
        if not line:
            # must be at the end
            if self._size and self._size != pos + 1:
                raise AssertionError("%s %s" % (self._size, pos))
            trailers += 1
            continue
        elements = line.split('\0')
        if len(elements) != self._expected_elements:
            raise errors.BadIndexData(self)
        # keys are tuples. Each element is a string that may occur many
        # times, so we intern them to save space. AB, RC, 200807
        key = tuple([intern(part) for part in elements[:self._key_length]])
        if first_key is None:
            first_key = key
        absent, references, value = elements[-3:]
        # reference lists are tab separated; the offsets inside one list
        # are separated by \r, and empty entries are dropped.
        ref_lists = tuple([
            tuple([int(ref) for ref in ref_string.split('\r') if ref])
            for ref_string in references.split('\t')])
        self._keys_by_offset[pos] = (key, absent, ref_lists, value)
        pos += len(line) + 1 # +1 for the \n
        if not absent:
            if self.node_ref_lists:
                node_value = (value, ref_lists)
            else:
                node_value = value
            nodes.append((key, node_value))
    return first_key, key, nodes, trailers

1063

1064

def _parsed_bytes(self, start, start_key, end, end_key):
    """Mark the bytes from start to end as parsed.

    Calling self._parsed_bytes(1, key, 2, key) will mark one byte (the one
    at offset 1) as parsed. The byte map and the key map are kept in step:
    a range that touches an existing entry extends it, a range that
    touches two entries joins them, and any other range is inserted as a
    new entry.

    :param start: The start of the parsed region.
    :param start_key: The first key in the parsed region.
    :param end: The end of the parsed region.
    :param end_key: The last key in the parsed region.
    """
    byte_map = self._parsed_byte_map
    key_map = self._parsed_key_map
    index = self._parsed_byte_index(start)
    if index == -1:
        # first range parsed is always the beginning.
        byte_map.insert(index, (start, end))
        key_map.insert(index, (start_key, end_key))
        return
    above = index + 1
    touches_lower = byte_map[index][1] == start
    touches_upper = above < len(byte_map) and byte_map[above][0] == end
    if touches_lower and touches_upper:
        # combine two regions
        byte_map[index] = (byte_map[index][0], byte_map[above][1])
        key_map[index] = (key_map[index][0], key_map[above][1])
        del byte_map[above]
        del key_map[above]
    elif touches_lower:
        # extend the lower entry
        byte_map[index] = (byte_map[index][0], end)
        key_map[index] = (key_map[index][0], end_key)
    elif touches_upper:
        # extend the higher entry
        byte_map[above] = (start, byte_map[above][1])
        key_map[above] = (start_key, key_map[above][1])
    else:
        # new entry
        byte_map.insert(above, (start, end))
        key_map.insert(above, (start_key, end_key))

1113

1114

def _read_and_parse(self, readv_ranges):
    """Read the ranges and parse the resulting data.

    Nothing is done for an empty range list. If the index is not yet
    fully buffered and at least half of the file has already been read,
    the whole file is buffered instead of issuing another partial read.

    :param readv_ranges: A prepared readv range list.
    """
    if not readv_ranges:
        return
    not_buffered = self._nodes is None
    if not_buffered and self._bytes_read * 2 >= self._size:
        # We've already read more than 50% of the file and we are about to
        # request more data, just _buffer_all() and be done
        self._buffer_all()
        return

    chunks = self._transport.readv(
        self._name, readv_ranges, True, self._size)
    # parse
    for offset, data in chunks:
        chunk_length = len(data)
        self._bytes_read += chunk_length
        if offset == 0 and chunk_length == self._size:
            # We read the whole range, most likely because the
            # Transport upcast our readv ranges into one long request
            # for enough total data to grab the whole index.
            self._buffer_all(StringIO(data))
            return
        if self._bisect_nodes is None:
            # no header parsed yet, so this must be the start
            if offset != 0:
                raise AssertionError()
            offset, data = self._parse_header_from_bytes(data)
        self._parse_region(offset, data)

1145

1146

def _signature(self):
    """Return the signature string that files of this index type start with."""
    return _SIGNATURE

1149

1150

def validate(self):
    """Validate that everything in the index can be accessed."""
    # iter_all validates completely at the moment, so simply exhaust it
    # and discard the entries.
    for _entry in self.iter_all_entries():
        pass

1155

1156

1157

class CombinedGraphIndex(object):

1158

"""A GraphIndex made up from smaller GraphIndices.

1159

1160

The backing indices must implement GraphIndex, and are presumed to be

1161

static data.

1162

1163

Queries against the combined index will be made against the first index,

1164

and then the second and so on. The order of index's can thus influence

1165

performance significantly. For example, if one index is on local disk and a

1166

second on a remote server, the local disk index should be before the other

1167

in the index list.

1168

"""

1169

1170

def __init__(self, indices, reload_func=None):

1171

"""Create a CombinedGraphIndex backed by indices.

1172

1173

:param indices: An ordered list of indices to query for data.

1174

:param reload_func: A function to call if we find we are missing an

1175

index. Should have the form reload_func() => True/False to indicate

1176

if reloading actually changed anything.

1177

"""

1178

self._indices = indices

1179

self._reload_func = reload_func

1180

1181

def __repr__(self):

1182

return "%s(%s)" % (

1183

self.__class__.__name__,

1184

', '.join(map(repr, self._indices)))

1185

1186

def get_parent_map(self, keys):

1187

"""See graph._StackedParentsProvider.get_parent_map"""

1188

search_keys = set(keys)

1189

if NULL_REVISION in search_keys:

1190

search_keys.discard(NULL_REVISION)

1191

found_parents = {NULL_REVISION:[]}

1192

else:

1193

found_parents = {}

1194

for index, key, value, refs in self.iter_entries(search_keys):

1195

parents = refs[0]

1196

if not parents:

1197

parents = (NULL_REVISION,)

1198

found_parents[key] = parents

1199

return found_parents

1200

1201

has_key = _has_key_from_parent_map

1202

1203

def insert_index(self, pos, index):

1204

"""Insert a new index in the list of indices to query.

1205

1206

:param pos: The position to insert the index.

1207

:param index: The index to insert.

1208

"""

1209

self._indices.insert(pos, index)

1210

1211

def iter_all_entries(self):

1212

"""Iterate over all keys within the index

1213

1214

Duplicate keys across child indices are presumed to have the same

1215

value and are only reported once.

1216

1217

:return: An iterable of (index, key, reference_lists, value).

1218

There is no defined order for the result iteration - it will be in

1219

the most efficient order for the index.

1220

"""

1221

seen_keys = set()

1222

while True:

1223

try:

1224

for index in self._indices:

1225

for node in index.iter_all_entries():

1226

if node[1] not in seen_keys:

1227

yield node

1228

seen_keys.add(node[1])

1229

return

1230

except errors.NoSuchFile:

1231

self._reload_or_raise()

1232

1233

def iter_entries(self, keys):

1234

"""Iterate over keys within the index.

1235

1236

Duplicate keys across child indices are presumed to have the same

1237

value and are only reported once.

1238

1239

:param keys: An iterable providing the keys to be retrieved.

1240

:return: An iterable of (index, key, reference_lists, value). There is no

1241

defined order for the result iteration - it will be in the most

1242

efficient order for the index.

1243

"""

1244

keys = set(keys)

1245

while True:

1246

try:

1247

for index in self._indices:

1248

if not keys:

1249

return

1250

for node in index.iter_entries(keys):

1251

keys.remove(node[1])

1252

yield node

1253

return

1254

except errors.NoSuchFile:

1255

self._reload_or_raise()

1256

1257

def iter_entries_prefix(self, keys):

1258

"""Iterate over keys within the index using prefix matching.

1259

1260

Duplicate keys across child indices are presumed to have the same

1261

value and are only reported once.

1262

1263

Prefix matching is applied within the tuple of a key, not to within

1264

the bytestring of each key element. e.g. if you have the keys ('foo',

1265

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1266

only the former key is returned.

1267

1268

:param keys: An iterable providing the key prefixes to be retrieved.

1269

Each key prefix takes the form of a tuple the length of a key, but

1270

with the last N elements 'None' rather than a regular bytestring.

1271

The first element cannot be 'None'.

1272

:return: An iterable as per iter_all_entries, but restricted to the

1273

keys with a matching prefix to those supplied. No additional keys

1274

will be returned, and every match that is in the index will be

1275

returned.

1276

"""

1277

keys = set(keys)

1278

if not keys:

1279

return

1280

seen_keys = set()

1281

while True:

1282

try:

1283

for index in self._indices:

1284

for node in index.iter_entries_prefix(keys):

1285

if node[1] in seen_keys:

1286

continue

1287

seen_keys.add(node[1])

1288

yield node

1289

return

1290

except errors.NoSuchFile:

1291

self._reload_or_raise()

1292

1293

def key_count(self):

1294

"""Return an estimate of the number of keys in this index.

1295

1296

For CombinedGraphIndex this is approximated by the sum of the keys of

1297

the child indices. As child indices may have duplicate keys this can

1298

have a maximum error of the number of child indices * largest number of

1299

keys in any index.

1300

"""

1301

while True:

1302

try:

1303

return sum((index.key_count() for index in self._indices), 0)

1304

except errors.NoSuchFile:

1305

self._reload_or_raise()

1306

1307

missing_keys = _missing_keys_from_parent_map

1308

1309

def _reload_or_raise(self):

1310

"""We just got a NoSuchFile exception.

1311

1312

Try to reload the indices, if it fails, just raise the current

1313

exception.

1314

"""

1315

if self._reload_func is None:

1316

raise

1317

exc_type, exc_value, exc_traceback = sys.exc_info()

1318

trace.mutter('Trying to reload after getting exception: %s',

1319

exc_value)

1320

if not self._reload_func():

1321

# We tried to reload, but nothing changed, so we fail anyway

1322

trace.mutter('_reload_func indicated nothing has changed.'

1323

' Raising original exception.')

1324

raise exc_type, exc_value, exc_traceback

1325

1326

def validate(self):

1327

"""Validate that everything in the index can be accessed."""

1328

while True:

1329

try:

1330

for index in self._indices:

1331

index.validate()

1332

return

1333

except errors.NoSuchFile:

1334

self._reload_or_raise()

1335

1336

1337

class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during a
    single write operation, where the accumulated entries need to be immediately
    available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add,
            or of (key, value) entries when this index has no reference
            lists.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when this index has no reference lists.
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (in this case
            dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        with_references = self.reference_lists
        # _nodes maps key -> (absent, references, value); absent nodes are
        # not reported.
        for key, (absent, references, value) in self._nodes.iteritems():
            if absent:
                continue
            if with_references:
                yield self, key, value, references
            else:
                yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when this index has no reference lists.
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (keys iteration order
            in this case).
        """
        keys = set(keys)
        with_references = self.reference_lists
        for key in keys.intersection(self._keys):
            node = self._nodes[key]
            if node[0]:
                # absent node
                continue
            if with_references:
                yield self, key, node[2], node[1]
            else:
                yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        :raises BadIndexKey: if a prefix starts with None or does not have
            the key length of this index.
        """
        # XXX: To much duplication with the GraphIndex class; consider finding
        # a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        if self._key_length == 1:
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                try:
                    node = self._nodes[key]
                except KeyError:
                    # a non-existant lookup matches nothing, exactly as in
                    # the multi-element case below.
                    continue
                if node[0]:
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
            return
        nodes_by_key = self._get_nodes_by_key()
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = nodes_by_key
            elements = list(key)
            # find the subdict to return
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existant lookup.
                continue
            if not elements:
                # every element was given, so key_dict is the node itself
                yield (self, ) + key_dict
                continue
            # some trailing elements are None: walk the remaining levels
            # of nested dicts and report every node below this point.
            dicts = [key_dict]
            while dicts:
                key_dict = dicts.pop(-1)
                # can't be empty or would not exist
                sample = key_dict.itervalues().next()
                if isinstance(sample, dict):
                    # push keys
                    dicts.extend(key_dict.itervalues())
                else:
                    # yield keys
                    for value in key_dict.itervalues():
                        yield (self, ) + value

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory index's have no known corruption at the moment."""

1476

1477

1478

class GraphIndexPrefixAdapter(object):
    """An adapter between GraphIndex with different key lengths.

    Queries against this will emit queries against the adapted Graph with the
    prefix added, queries for all items use iter_entries_prefix. The returned
    nodes will have their keys and node references adjusted to remove the
    prefix. Finally, an add_nodes_callback can be supplied - when called the
    nodes and references being added will have prefix prepended.
    """

    def __init__(self, adapted, prefix, missing_key_length,
        add_nodes_callback=None):
        """Construct an adapter against adapted with prefix.

        :param adapted: The index that queries are forwarded to.
        :param prefix: The tuple of key elements to add to every key.
        :param missing_key_length: How many None elements to append to
            prefix to form the prefix key used by iter_all_entries.
        :param add_nodes_callback: Called by add_nodes with the list of
            prefixed nodes.
        """
        self.adapted = adapted
        self.prefix_key = prefix + (None,)*missing_key_length
        self.prefix = prefix
        self.prefix_len = len(prefix)
        self.add_nodes_callback = add_nodes_callback

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add;
            (key, value) entries are accepted as well.
        """
        # save nodes in case its an iterator
        nodes = tuple(nodes)
        try:
            # Add prefix_key to each reference node_refs is a tuple of tuples,
            # so split it apart, and add prefix_key to the internal reference
            translated_nodes = []
            for (key, value, node_refs) in nodes:
                adjusted_references = tuple(
                    tuple(self.prefix + ref_node for ref_node in ref_list)
                    for ref_list in node_refs)
                translated_nodes.append((self.prefix + key, value,
                    adjusted_references))
        except ValueError:
            # XXX: TODO add an explicit interface for getting the reference list
            # status, to handle this bit of user-friendliness in the API more
            # explicitly.
            # The nodes did not unpack as triples; treat them as (key, value)
            # pairs and start the translated list afresh.
            translated_nodes = [(self.prefix + key, value)
                                for (key, value) in nodes]
        self.add_nodes_callback(translated_nodes)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \0 or \n.
        """
        self.add_nodes(((key, value, references), ))

    def _strip_prefix(self, an_iter):
        """Strip prefix data from nodes and return it.

        :param an_iter: An iterable of (index, key, value, reference_lists)
            nodes, or (index, key, value) nodes when the adapted index has
            no reference lists.
        :return: A generator of the same nodes with the prefix removed from
            the key and from every referenced key.
        :raises BadIndexData: if a key or a referenced key does not start
            with the prefix.
        """
        prefix = self.prefix
        prefix_len = self.prefix_len
        for node in an_iter:
            # cross checks
            if node[1][:prefix_len] != prefix:
                raise errors.BadIndexData(self)
            stripped_key = node[1][prefix_len:]
            if len(node) < 4:
                # node without reference lists: there is nothing further
                # to check or strip.
                yield node[0], stripped_key, node[2]
                continue
            for ref_list in node[3]:
                for ref_node in ref_list:
                    if ref_node[:prefix_len] != prefix:
                        raise errors.BadIndexData(self)
            yield node[0], stripped_key, node[2], (
                tuple(tuple(ref_node[prefix_len:] for ref_node in ref_list)
                for ref_list in node[3]))

    def iter_all_entries(self):
        """Iterate over all keys within the index

        iter_all_entries is implemented against the adapted index using
        iter_entries_prefix.

        :return: An iterable of (index, key, value, reference_lists). There
            is no defined order for the result iteration - it is whatever
            order the adapted index yields.
        """
        return self._strip_prefix(self.adapted.iter_entries_prefix([self.prefix_key]))

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists). There
            is no defined order for the result iteration - it is whatever
            order the adapted index yields.
        """
        return self._strip_prefix(self.adapted.iter_entries(
            self.prefix + key for key in keys))

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        return self._strip_prefix(self.adapted.iter_entries_prefix(
            self.prefix + key for key in keys))

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For GraphIndexPrefixAdapter this is relatively expensive - key
        iteration with the prefix is done.
        """
        return len(list(self.iter_all_entries()))

    def validate(self):
        """Call the adapted's validate."""
        self.adapted.validate()

Older »