/brz/remove-bazaar : revision 2592.3.169

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Robert Collins
Date: 2007-10-08 04:53:50 UTC
mfrom: (2890.1.2 readv)
mto: This revision was merged to the branch mainline in revision 2933.
Revision ID: robertc@robertcollins.net-20071008045350-qwh1gb3r9vy3c8kk

Readv fixes.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics.py

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/multiparent.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/HttpServer.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/last-modified.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/profiling.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/user-guide

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/centralized_workflow.txt

doc/en/user-guide/configuration.txt

doc/en/user-guide/conflicts.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/index.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/tutorial.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/version_info.txt

doc/en/user-reference

doc/en/user-reference/hooks.txt

doc/en/user-reference/index.txt

doc/index.txt

generate_docs.py

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

tools/win32/survey.txt

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

# Public API of this module: the names exported by a star-import.
__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.trace import mutter

""")

from bzrlib import debug, errors

# Header option prefixes. GraphIndexBuilder.finish() emits one header line per
# option, formed as prefix + decimal number + newline.
# Number of bytestring elements in each key.
_OPTION_KEY_ELEMENTS = "key_elements="

# Number of keys added to the index.
_OPTION_LEN = "len="

# Number of reference lists stored for each node.
_OPTION_NODE_REFS = "node_ref_lists="

# First line of a serialised index.
_SIGNATURE = "Bazaar Graph Index 1\n"

# Matches any character that is not allowed inside a key element
# (tab, newline, vertical tab, form feed, carriage return, NUL, space).
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

# Matches the two characters that are not allowed inside a node value.
_newline_null_re = re.compile('[\n\0]')

class GraphIndexBuilder(object):

"""A builder that can build a GraphIndex.

The resulting graph has the structure:

_SIGNATURE OPTIONS NODES NEWLINE

_SIGNATURE := 'Bazaar Graph Index 1' NEWLINE

OPTIONS := 'node_ref_lists=' DIGITS NEWLINE 'key_elements=' DIGITS NEWLINE 'len=' DIGITS NEWLINE

NODES := NODE*

NODE := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

KEY := Not-whitespace-utf8

ABSENT := 'a'

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

REFERENCE := DIGITS ; digits is the byte offset in the index of the

; referenced key.

VALUE := no-newline-no-null-bytes

"""

def __init__(self, reference_lists=0, key_elements=1):
    """Set up an empty GraphIndex builder.

    :param reference_lists: How many lists of node references every
        entry carries.
    :param key_elements: How many bytestrings make up each key.
    """
    # Fixed shape of the index being built.
    self._key_length = key_elements
    self.reference_lists = reference_lists
    # Nothing has been added yet: no nodes (present or absent), no
    # nested per-element lookup entries, and no present keys.
    self._nodes_by_key = {}
    self._nodes = {}
    self._keys = set()

def _check_key(self, key):
    """Validate key against this index's key shape.

    A valid key is exactly a tuple holding self._key_length elements, each
    of which is non-empty and free of whitespace/NUL characters.

    :raises BadIndexKey: with the whole key when it is not a tuple of the
        right length, or with the offending element when an element is
        empty or contains a forbidden character.
    """
    # Exact type match on purpose: only plain tuples are accepted.
    if type(key) != tuple or len(key) != self._key_length:
        raise errors.BadIndexKey(key)
    for part in key:
        if part and _whitespace_re.search(part) is None:
            continue
        raise errors.BadIndexKey(part)

def add_node(self, key, value, references=()):
    """Add a node to the index.

    Every check is performed before the builder is modified, so a call
    that raises leaves the builder's contents unchanged.

    :param key: The key. keys are non-empty tuples containing
        as many whitespace-free utf8 bytestrings as the key length
        defined for this index.
    :param value: The value to associate with the key. It may be any
        bytes as long as it does not contain \\0 or \\n.
    :param references: An iterable of iterables of keys. Each is a
        reference to another key. Its length must equal the number of
        reference lists this builder was created with.
    :raises BadIndexKey: if key, or any referenced key, is not a valid
        key for this index.
    :raises BadIndexValue: if value contains \\0 or \\n, or if the number
        of reference lists is wrong.
    :raises BadIndexDuplicateKey: if key was already added as a present
        (non-absent) node.
    """
    self._check_key(key)
    if _newline_null_re.search(value) is not None:
        raise errors.BadIndexValue(value)
    if len(references) != self.reference_lists:
        raise errors.BadIndexValue(references)
    # Materialise each reference list exactly once. Iterating it for
    # validation and then calling tuple() on it again would silently
    # record an empty list for one-shot iterables such as generators.
    node_refs = tuple(tuple(reference_list) for reference_list in references)
    # Collect the referenced keys that are not known yet, but do not
    # record them until all validation has passed.
    absent_references = []
    for reference_list in node_refs:
        for reference in reference_list:
            self._check_key(reference)
            if reference not in self._nodes:
                absent_references.append(reference)
    # An existing entry flagged 'a' is only an absent placeholder created
    # by an earlier reference; it may be replaced by the real node.
    if key in self._nodes and self._nodes[key][0] == '':
        raise errors.BadIndexDuplicateKey(key, self)
    # All checks passed: only now start modifying the builder.
    for reference in absent_references:
        self._nodes[reference] = ('a', (), '')
    self._nodes[key] = ('', node_refs, value)
    self._keys.add(key)
    if self._key_length > 1:
        if self.reference_lists:
            key_value = key, value, node_refs
        else:
            key_value = key, value
        # possibly should do this on-demand, but it seems likely it is
        # always wanted
        # For a key of (foo, bar, baz) create
        # _nodes_by_key[foo][bar][baz] = key_value
        key_dict = self._nodes_by_key
        for subkey in key[:-1]:
            key_dict = key_dict.setdefault(subkey, {})
        key_dict[key[-1]] = key_value

131

132

def finish(self):
    """Serialise the index and return it as a file-like object.

    The output is the signature, three option lines (number of reference
    lists, key length, key count), one line per node sorted by key, and a
    terminating empty line.

    :return: A StringIO positioned at the start of the serialised index.
    :raises BzrError: If reference lists are in use and the serialised
        length differs from the length predicted by the pre-pass.
    """
    lines = [_SIGNATURE]
    lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
    lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
    lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')
    prefix_length = sum(len(x) for x in lines)
    # references are byte offsets. To avoid having to do nasty
    # polynomial work to resolve offsets (references to later in the
    # file cannot be determined until all the inbetween references have
    # been calculated too) we pad the offsets with 0's to make them be
    # of consistent length. Using binary offsets would break the trivial
    # file parsing.
    # to calculate the width of zero's needed we do three passes:
    # one to gather all the non-reference data and the number of references.
    # one to pad all the data with reference-length and determine entry
    # addresses.
    # One to serialise.

    # forward sorted by key. In future we may consider topological sorting,
    # at the cost of table scans for direct lookup, or a second index for
    # direct lookup
    nodes = sorted(self._nodes.items())
    # if we do not prepass, we don't know how long it will be up front.
    expected_bytes = None
    # we only need to pre-pass if we have reference lists at all.
    if self.reference_lists:
        key_offset_info = []
        non_ref_bytes = prefix_length
        total_references = 0
        # TODO use simple multiplication for the constants in this loop.
        for key, (absent, references, value) in nodes:
            # record the offset known *so far* for this key:
            # the non reference bytes to date, and the total references to
            # date - saves reaccumulating on the second pass
            key_offset_info.append((key, non_ref_bytes, total_references))
            # key is a variable length tuple, \x00 between elements
            non_ref_bytes += sum(len(element) for element in key)
            if self._key_length > 1:
                non_ref_bytes += self._key_length - 1
            # value is literal bytes, there are 3 null's, 1 NL.
            non_ref_bytes += len(value) + 3 + 1
            if absent:
                # one byte for the absent marker.
                non_ref_bytes += 1
            else:
                # (ref_lists - 1) tabs
                non_ref_bytes += self.reference_lists - 1
                for ref_list in references:
                    # how many references across the whole file?
                    total_references += len(ref_list)
                    # (refs - 1) cr separators per non-empty ref list
                    if ref_list:
                        non_ref_bytes += len(ref_list) - 1
        # how many digits are needed to represent the total byte count?
        digits = 1
        possible_total_bytes = non_ref_bytes + total_references*digits
        while 10 ** digits < possible_total_bytes:
            digits += 1
            possible_total_bytes = non_ref_bytes + total_references*digits
        expected_bytes = possible_total_bytes + 1 # terminating newline
        # resolve key addresses.
        key_addresses = {}
        for key, non_ref_bytes, total_references in key_offset_info:
            key_addresses[key] = non_ref_bytes + total_references*digits
        # zero-padded, fixed-width offset format
        format_string = '%%0%sd' % digits
    # serialise
    for key, (absent, references, value) in nodes:
        flattened_references = []
        for ref_list in references:
            ref_addresses = [format_string % key_addresses[reference]
                             for reference in ref_list]
            flattened_references.append('\r'.join(ref_addresses))
        string_key = '\x00'.join(key)
        lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,
            '\t'.join(flattened_references), value))
    lines.append('\n')
    # Join once and reuse the result for both the sanity check and the
    # returned stream.
    serialised = ''.join(lines)
    if expected_bytes and len(serialised) != expected_bytes:
        raise errors.BzrError('Failed index creation. Internal error:'
            ' mismatched output length and expected length: %d %d' %
            (len(serialised), expected_bytes))
    return StringIO(serialised)

217

218

219

class GraphIndex(object):

220

"""An index for data with embedded graphs.

221

222

The index maps keys to a list of key reference lists, and a value.

223

Each node has the same number of key reference lists. Each key reference

224

list can be empty or an arbitrary length. The value is an opaque NULL

225

terminated string without any newlines. The storage of the index is

226

hidden in the interface: keys and key references are always tuples of

227

bytestrings, never the internal representation (e.g. dictionary offsets).

228

229

It is presumed that the index will not be mutated - it is static data.

230

231

Successive iter_all_entries calls will read the entire index each time.

232

Additionally, iter_entries calls will read the index linearly until the

233

desired keys are found. XXX: This must be fixed before the index is

234

suitable for production use. :XXX

235

"""

236

237

def __init__(self, transport, name, size):

238

"""Open an index called name on transport.

239

240

:param transport: A bzrlib.transport.Transport.

241

:param name: A path to provide to transport API calls.

242

:param size: The size of the index in bytes. This is used for bisection

243

logic to perform partial index reads. While the size could be

244

obtained by statting the file this introduced an additional round

245

trip as well as requiring stat'able transports, both of which are

246

avoided by having it supplied. If size is None, then bisection

247

support will be disabled and accessing the index will just stream

248

all the data.

249

"""

250

self._transport = transport

251

self._name = name

252

# becomes a dict of key:(value, reference-list-byte-locations)

253

# used by the bisection interface to store parsed but not resolved

254

# keys.

255

self._bisect_nodes = None

256

self._nodes = None

257

# a sorted list of slice-addresses for the parsed bytes of the file.

258

# e.g. (0,1) would mean that byte 0 is parsed.

259

self._parsed_byte_map = []

260

# a sorted list of keys matching each slice address for parsed bytes

261

# e.g. (None, 'foo@bar') would mean that the first byte contained no

262

# key, and the end byte of the slice is the of the data for 'foo@bar'

263

self._parsed_key_map = []

264

self._key_count = None

265

self._keys_by_offset = None

266

self._nodes_by_key = None

267

self._size = size

268

269

def _buffer_all(self):
    """Buffer all the index data.

    Reads the whole file from the transport and populates self._nodes,
    self._nodes_by_key, self._keys_by_offset and self._keys (the header
    attributes are set by _read_prefix).

    :raises BadIndexData: If a line has the wrong number of elements, or
        the file does not contain exactly one empty trailer line.
    """
    if 'index' in debug.debug_flags:
        mutter('Reading entire index %s', self._transport.abspath(self._name))
    stream = self._transport.get(self._name)
    self._read_prefix(stream)
    expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # ready-to-return key:value or key:value, node_ref_lists
    self._nodes = {}
    self._nodes_by_key = {}
    trailers = 0
    pos = stream.tell()
    for line in stream.readlines():
        if line == '\n':
            trailers += 1
            continue
        elements = line.split('\0')
        if len(elements) != expected_elements:
            raise errors.BadIndexData(self)
        # keys are tuples
        key = tuple(elements[:self._key_length])
        absent, references, value = elements[-3:]
        value = value[:-1] # remove the newline
        # reference lists are tab separated; offsets within a list are
        # \r separated.
        ref_lists = tuple([
            tuple([int(ref) for ref in ref_string.split('\r') if ref])
            for ref_string in references.split('\t')])
        self._keys_by_offset[pos] = (key, absent, ref_lists, value)
        pos += len(line)
    for key, absent, references, value in self._keys_by_offset.itervalues():
        if absent:
            continue
        # resolve references (byte offsets) into the keys they point at:
        if self.node_ref_lists:
            node_value = (value, self._resolve_references(references))
        else:
            node_value = value
        self._nodes[key] = node_value
        if self._key_length > 1:
            key_dict = self._nodes_by_key
            if self.node_ref_lists:
                key_value = key, node_value[0], node_value[1]
            else:
                key_value = key, node_value
            # possibly should do this on-demand, but it seems likely it is
            # always wanted
            # For a key of (foo, bar, baz) create
            # _nodes_by_key[foo][bar][baz] = key_value
            for subkey in key[:-1]:
                key_dict = key_dict.setdefault(subkey, {})
            key_dict[key[-1]] = key_value
    # cache the keys for quick set intersections
    self._keys = set(self._nodes)
    if trailers != 1:
        # there must be one line - the empty trailer line.
        raise errors.BadIndexData(self)

337

338

def iter_all_entries(self):
    """Iterate over all keys within the index.

    The whole index is buffered first if that has not already happened.

    :return: An iterable of (index, key, value) or
        (index, key, value, reference_lists). The former tuple is used
        when there are no reference lists in the index, making the API
        compatible with simple key:value index types. There is no defined
        order for the result iteration - it will be in the most efficient
        order for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    if not self.node_ref_lists:
        for key, value in self._nodes.iteritems():
            yield self, key, value
        return
    for key, node in self._nodes.iteritems():
        value, node_ref_lists = node
        yield self, key, value, node_ref_lists

358

359

def _read_prefix(self, stream):
    """Read and validate the index header from stream.

    Consumes the signature and the three option lines, storing the parsed
    integers on self.node_ref_lists, self._key_length and self._key_count.

    :param stream: A file-like object positioned at the start of the index.
    :raises BadIndexFormatSignature: If the signature does not match.
    :raises BadIndexOptions: If an option line is missing its expected
        prefix or its value is not an integer.
    """
    expected_signature = self._signature()
    if stream.read(len(expected_signature)) != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    # The option lines appear in a fixed order; each is
    # "<prefix><integer>\n".
    header_options = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    for prefix, attribute in header_options:
        options_line = stream.readline()
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            # [:-1] drops the trailing newline.
            parsed = int(options_line[len(prefix):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed)

384

385

def _resolve_references(self, references):

386

"""Return the resolved key references for references."""

387

node_refs = []

388

for ref_list in references:

389

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

390

return tuple(node_refs)

391

392

def _find_index(self, range_map, key):

393

"""Helper for the _parsed_*_index calls.

394

395

Given a range map - [(start, end), ...], finds the index of the range

396

in the map for key if it is in the map, and if it is not there, the

397

immediately preceeding range in the map.

398

"""

399

result = bisect_right(range_map, key) - 1

400

if result + 1 < len(range_map):

401

# check the border condition, it may be in result + 1

402

if range_map[result + 1][0] == key[0]:

403

return result + 1

404

return result

405

406

def _parsed_byte_index(self, offset):

407

"""Return the index of the entry immediately before offset.

408

409

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

410

there is one unparsed byte (the 11th, addressed as[10]). then:

411

asking for 0 will return 0

412

asking for 10 will return 0

413

asking for 11 will return 1

414

asking for 12 will return 1

415

"""

416

key = (offset, 0)

417

return self._find_index(self._parsed_byte_map, key)

418

419

def _parsed_key_index(self, key):

420

"""Return the index of the entry immediately before key.

421

422

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

423

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

424

have been parsed, then:

425

asking for '' will return 0

426

asking for 'a' will return 0

427

asking for 'b' will return 1

428

asking for 'e' will return 1

429

"""

430

search_key = (key, None)

431

return self._find_index(self._parsed_key_map, search_key)

432

433

def _is_parsed(self, offset):

434

"""Returns True if offset has been parsed."""

435

index = self._parsed_byte_index(offset)

436

if index == len(self._parsed_byte_map):

437

return offset < self._parsed_byte_map[index - 1][1]

438

start, end = self._parsed_byte_map[index]

439

return offset >= start and offset < end

440

441

def _iter_entries_from_total_buffer(self, keys):

442

"""Iterate over keys when the entire index is parsed."""

443

keys = keys.intersection(self._keys)

444

if self.node_ref_lists:

445

for key in keys:

446

value, node_refs = self._nodes[key]

447

yield self, key, value, node_refs

448

else:

449

for key in keys:

450

yield self, key, self._nodes[key]

451

452

def iter_entries(self, keys):

453

"""Iterate over keys within the index.

454

455

:param keys: An iterable providing the keys to be retrieved.

456

:return: An iterable as per iter_all_entries, but restricted to the

457

keys supplied. No additional keys will be returned, and every

458

key supplied that is in the index will be returned.

459

"""

460

keys = set(keys)

461

if not keys:

462

return []

463

if self._size is None and self._nodes is None:

464

self._buffer_all()

465

if self._nodes is not None:

466

return self._iter_entries_from_total_buffer(keys)

467

else:

468

return (result[1] for result in bisect_multi_bytes(

469

self.lookup_keys_via_location, self._size, keys))

470

471

def iter_entries_prefix(self, keys):

472

"""Iterate over keys within the index using prefix matching.

473

474

Prefix matching is applied within the tuple of a key, not to within

475

the bytestring of each key element. e.g. if you have the keys ('foo',

476

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

477

only the former key is returned.

478

479

WARNING: Note that this method currently causes a full index parse

480

unconditionally (which is reasonably appropriate as it is a means for

481

thunking many small indices into one larger one and still supplies

482

iter_all_entries at the thunk layer).

483

484

:param keys: An iterable providing the key prefixes to be retrieved.

485

Each key prefix takes the form of a tuple the length of a key, but

486

with the last N elements 'None' rather than a regular bytestring.

487

The first element cannot be 'None'.

488

:return: An iterable as per iter_all_entries, but restricted to the

489

keys with a matching prefix to those supplied. No additional keys

490

will be returned, and every match that is in the index will be

491

returned.

492

"""

493

keys = set(keys)

494

if not keys:

495

return

496

# load data - also finds key lengths

497

if self._nodes is None:

498

self._buffer_all()

499

if self._key_length == 1:

500

for key in keys:

501

# sanity check

502

if key[0] is None:

503

raise errors.BadIndexKey(key)

504

if len(key) != self._key_length:

505

raise errors.BadIndexKey(key)

506

if self.node_ref_lists:

507

value, node_refs = self._nodes[key]

508

yield self, key, value, node_refs

509

else:

510

yield self, key, self._nodes[key]

511

return

512

for key in keys:

513

# sanity check

514

if key[0] is None:

515

raise errors.BadIndexKey(key)

516

if len(key) != self._key_length:

517

raise errors.BadIndexKey(key)

518

# find what it refers to:

519

key_dict = self._nodes_by_key

520

elements = list(key)

521

# find the subdict whose contents should be returned.

522

try:

523

while len(elements) and elements[0] is not None:

524

key_dict = key_dict[elements[0]]

525

elements.pop(0)

526

except KeyError:

527

# a non-existant lookup.

528

continue

529

if len(elements):

530

dicts = [key_dict]

531

while dicts:

532

key_dict = dicts.pop(-1)

533

# can't be empty or would not exist

534

item, value = key_dict.iteritems().next()

535

if type(value) == dict:

536

# push keys

537

dicts.extend(key_dict.itervalues())

538

else:

539

# yield keys

540

for value in key_dict.itervalues():

541

# each value is the key:value:node refs tuple

542

# ready to yield.

543

yield (self, ) + value

544

else:

545

# the last thing looked up was a terminal element

546

yield (self, ) + key_dict

547

548

def key_count(self):

549

"""Return an estimate of the number of keys in this index.

550

551

For GraphIndex the estimate is exact.

552

"""

553

if self._key_count is None:

554

# really this should just read the prefix

555

self._buffer_all()

556

return self._key_count

557

558

def lookup_keys_via_location(self, location_keys):
    """Public interface for implementing bisection.

    If _buffer_all has been called, then all the data for the index is in
    memory, and this method should not be called, as it uses a separate
    cache because it cannot pre-resolve all indices, which buffer_all does
    for performance.

    :param location_keys: A list of location, key tuples. It is iterated
        twice, so it must not be a one-shot iterator.
    :return: A list of (location_key, result) tuples as expected by
        bzrlib.bisect_multi.bisect_multi_bytes. result is the node tuple
        when the key was found, False when the key is known to be missing,
        and -1 / +1 when the key lies below / above the probed location.
    """
    # Possible improvements:
    #  - only bisect lookup each key once
    #  - sort the keys first, and use that to reduce the bisection window
    # -----
    # this progresses in three parts:
    # read data
    # parse it
    # attempt to answer the question from the now in memory data.
    # build the readv request
    # for each location, ask for 800 bytes - much more than rows we've seen
    # anywhere.
    readv_ranges = []
    for location, key in location_keys:
        # can we answer from cache?
        # - if we know the answer - yes
        index = self._parsed_key_index(key)
        if (len(self._parsed_key_map) and
            self._parsed_key_map[index][0] <= key and
            (self._parsed_key_map[index][1] > key or
             # end of the file has been parsed
             self._parsed_byte_map[index][1] == self._size)):
            # the key has been parsed, so no lookup is needed
            continue
        # - if we have examined this part of the file already - yes
        index = self._parsed_byte_index(location)
        if (len(self._parsed_byte_map) and
            self._parsed_byte_map[index][0] <= location and
            self._parsed_byte_map[index][1] > location):
            # the byte region has been parsed, so no read is needed.
            continue
        length = 800
        if location + length > self._size:
            length = self._size - location
        # todo, trim out parsed locations.
        if length > 0:
            readv_ranges.append((location, length))
    # read the header if needed
    if self._bisect_nodes is None:
        readv_ranges.append((0, 200))
    self._read_and_parse(readv_ranges)
    # generate results:
    #  - figure out <, >, missing, present
    #  - result present references so we can return them.
    result = []
    # keys that we cannot answer until we resolve references
    pending_references = []
    pending_locations = set()
    for location, key in location_keys:
        # can we answer from cache?
        index = self._parsed_key_index(key)
        if (self._parsed_key_map[index][0] <= key and
            (self._parsed_key_map[index][1] > key or
             # end of the file has been parsed
             self._parsed_byte_map[index][1] == self._size)):
            # the key has been parsed, so no lookup is needed
            if key in self._bisect_nodes:
                if self.node_ref_lists:
                    # the references may not have been all parsed.
                    value, refs = self._bisect_nodes[key]
                    wanted_locations = []
                    for ref_list in refs:
                        for ref in ref_list:
                            if ref not in self._keys_by_offset:
                                wanted_locations.append(ref)
                    if wanted_locations:
                        # defer: the referenced rows must be read first.
                        pending_locations.update(wanted_locations)
                        pending_references.append((location, key))
                        continue
                    result.append(((location, key), (self, key,
                        value, self._resolve_references(refs))))
                else:
                    result.append(((location, key),
                        (self, key, self._bisect_nodes[key])))
            else:
                # the region holding key is parsed and key is not in it.
                result.append(((location, key), False))
            continue
        # no, is the key above or below the probed location:
        # get the range of the probed & parsed location
        index = self._parsed_byte_index(location)
        # if the key is below the start of the range, its below
        if key < self._parsed_key_map[index][0]:
            direction = -1
        else:
            direction = +1
        result.append(((location, key), direction))
    readv_ranges = []
    # lookup data to resolve references
    for location in pending_locations:
        length = 800
        if location + length > self._size:
            length = self._size - location
        # TODO: trim out parsed locations (e.g. if the 800 is into the
        # parsed region trim it, and dont use the adjust_for_latency
        # facility)
        if length > 0:
            readv_ranges.append((location, length))
    self._read_and_parse(readv_ranges)
    for location, key in pending_references:
        # answer key references we had to look-up-late.
        value, refs = self._bisect_nodes[key]
        result.append(((location, key), (self, key,
            value, self._resolve_references(refs))))
    return result

674

675

def _parse_header_from_bytes(self, bytes):
    """Parse the header from a region of bytes.

    Sets self.node_ref_lists, self._key_length and self._key_count from
    the three option lines, marks the header bytes as parsed and
    initialises the bisection parsing state.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data. (which may be of length 0).
    :raises BadIndexFormatSignature: If the signature does not match.
    :raises BadIndexOptions: If an option line is malformed.
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if signature != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(expected_signature):].splitlines()
    header_options = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    for position, (prefix, attribute) in enumerate(header_options):
        options_line = lines[position]
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            parsed = int(options_line[len(prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed)
    # calculate the bytes we have processed: the signature, the three
    # option lines and the newline splitlines removed from each of them.
    header_end = len(signature) + sum(len(line) for line in lines[:3]) + 3
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

718

719

def _parse_region(self, offset, data):

720

"""Parse node data returned from a readv operation.

721

722

:param offset: The byte offset the data starts at.

723

:param data: The data to parse.

724

"""

725

# trim the data.

726

# end first:

727

end = offset + len(data)

728

index = self._parsed_byte_index(offset)

729

# default is to use all data

730

trim_end = None

731

# trivial check for entirely parsed data:

732

if end < self._parsed_byte_map[index][1]:

733

return

734

# accomodate overlap with data before this.

735

if offset < self._parsed_byte_map[index][1]:

736

# overlaps the lower parsed region

737

# skip the parsed data

738

trim_start = self._parsed_byte_map[index][1] - offset

739

# don't trim the start for \n

740

start_adjacent = True

741

elif offset == self._parsed_byte_map[index][1]:

742

# abuts the lower parsed region

743

# use all data

744

trim_start = None

745

# do not trim anything

746

start_adjacent = True

747

else:

748

# does not overlap the lower parsed region

749

# use all data

750

trim_start = None

751

# but trim the leading \n

752

start_adjacent = False

753

if end == self._size:

754

# lines up to the end of all data:

755

# use it all

756

trim_end = None

757

# do not strip to the last \n

758

end_adjacent = True

759

elif index + 1 == len(self._parsed_byte_map):

760

# at the end of the parsed data

761

# use it all

762

trim_end = None

763

# but strip to the last \n

764

end_adjacent = False

765

elif end == self._parsed_byte_map[index + 1][0]:

766

# buts up against the next parsed region

767

# use it all

768

trim_end = None

769

# do not strip to the last \n

770

end_adjacent = True

771

elif end > self._parsed_byte_map[index + 1][0]:

772

# overlaps into the next parsed region

773

# only consider the unparsed data

774

trim_end = self._parsed_byte_map[index + 1][0] - offset

775

# do not strip to the last \n as we know its an entire record

776

end_adjacent = True

777

else:

778

# does not overlap into the next region

779

# use it all

780

trim_end = None

781

# but strip to the last \n

782

end_adjacent = False

783

# now find bytes to discard if needed

784

if not start_adjacent:

785

# work around python bug in rfind

786

if trim_start is None:

787

trim_start = data.find('\n') + 1

788

else:

789

trim_start = data.find('\n', trim_start) + 1

790

assert trim_start != 0, 'no \n was present'

791

# print 'removing start', offset, trim_start, repr(data[:trim_start])

792

if not end_adjacent:

793

# work around python bug in rfind

794

if trim_end is None:

795

trim_end = data.rfind('\n') + 1

796

else:

797

trim_end = data.rfind('\n', None, trim_end) + 1

798

assert trim_end != 0, 'no \n was present'

799

# print 'removing end', offset, trim_end, repr(data[trim_end:])

800

# adjust offset and data to the parseable data.

801

trimmed_data = data[trim_start:trim_end]

802

assert trimmed_data, 'read unneeded data'

803

if trim_start:

804

offset += trim_start

805

# print "parsing", repr(trimmed_data)

806

# splitlines mangles the \r delimiters.. don't use it.

807

lines = trimmed_data.split('\n')

808

del lines[-1]

809

pos = offset

810

first_key = None

811

key = None

812

for line in lines:

813

if line == '':

814

# must be at the end

815

assert self._size == pos + 1, "%s %s" % (self._size, pos)

816

continue

817

elements = line.split('\0')

818

if len(elements) != self._expected_elements:

819

raise errors.BadIndexData(self)

820

# keys are tuples

821

key = tuple(elements[:self._key_length])

822

if first_key is None:

823

first_key = key

824

absent, references, value = elements[-3:]

825

ref_lists = []

826

for ref_string in references.split('\t'):

827

ref_lists.append(tuple([

828

int(ref) for ref in ref_string.split('\r') if ref

829

]))

830

ref_lists = tuple(ref_lists)

831

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

832

pos += len(line) + 1 # +1 for the \n

833

if absent:

834

continue

835

if self.node_ref_lists:

836

node_value = (value, ref_lists)

837

else:

838

node_value = value

839

self._bisect_nodes[key] = node_value

840

# print "parsed ", key

841

self._parsed_bytes(offset, first_key, offset + len(trimmed_data), key)

842

843

def _parsed_bytes(self, start, start_key, end, end_key):

844

"""Mark the bytes from start to end as parsed.

845

846

Calling self._parsed_bytes(1,2) will mark one byte (the one at offset

847

1) as parsed.

848

849

:param start: The start of the parsed region.

850

:param end: The end of the parsed region.

851

"""

852

index = self._parsed_byte_index(start)

853

new_value = (start, end)

854

new_key = (start_key, end_key)

855

if index == -1:

856

# first range parsed is always the beginning.

857

self._parsed_byte_map.insert(index, new_value)

858

self._parsed_key_map.insert(index, new_key)

859

return

860

# four cases:

861

# new region

862

# extend lower region

863

# extend higher region

864

# combine two regions

865

if (index + 1 < len(self._parsed_byte_map) and

866

self._parsed_byte_map[index][1] == start and

867

self._parsed_byte_map[index + 1][0] == end):

868

# combine two regions

869

self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],

870

self._parsed_byte_map[index + 1][1])

871

self._parsed_key_map[index] = (self._parsed_key_map[index][0],

872

self._parsed_key_map[index + 1][1])

873

elif self._parsed_byte_map[index][1] == start:

874

# extend the lower entry

875

self._parsed_byte_map[index] = (

876

self._parsed_byte_map[index][0], end)

877

self._parsed_key_map[index] = (

878

self._parsed_key_map[index][0], end_key)

879

elif (index + 1 < len(self._parsed_byte_map) and

880

self._parsed_byte_map[index + 1][0] == end):

881

# extend the higher entry

882

self._parsed_byte_map[index + 1] = (

883

start, self._parsed_byte_map[index + 1][1])

884

self._parsed_key_map[index + 1] = (

885

start_key, self._parsed_key_map[index + 1][1])

886

else:

887

# new entry

888

self._parsed_byte_map.insert(index + 1, new_value)

889

self._parsed_key_map.insert(index + 1, new_key)

890

assert sorted(self._parsed_byte_map) == self._parsed_byte_map

891

assert sorted(self._parsed_key_map) == self._parsed_key_map

892

893

def _read_and_parse(self, readv_ranges):

894

"""Read the the ranges and parse the resulting data.

895

896

:param readv_ranges: A prepared readv range list.

897

"""

898

if readv_ranges:

899

readv_data = self._transport.readv(self._name, readv_ranges, True,

900

self._size)

901

# parse

902

for offset, data in readv_data:

903

if self._bisect_nodes is None:

904

# this must be the start

905

assert offset == 0

906

offset, data = self._parse_header_from_bytes(data)

907

self._parse_region(offset, data)

908

# print offset, len(data), data

909

910

def _signature(self):
    """Return the signature expected at the start of this index type's files."""
    return _SIGNATURE

913

914

def validate(self):
    """Validate that everything in the index can be accessed.

    Any error raised while iterating over the entries propagates to the
    caller.
    """
    # iter_all validates completely at the moment, so just exhaust it.
    for _ in self.iter_all_entries():
        pass

919

920

921

class CombinedGraphIndex(object):
    """A GraphIndex made up from smaller GraphIndices.

    The backing indices must implement GraphIndex, and are presumed to be
    static data.

    Queries against the combined index will be made against the first index,
    and then the second and so on. The order of indices can thus influence
    performance significantly. For example, if one index is on local disk and
    a second on a remote server, the local disk index should be before the
    other in the index list.
    """

    def __init__(self, indices):
        """Create a CombinedGraphIndex backed by indices.

        :param indices: An ordered list of indices to query for data. The
            list object itself is retained (not copied) and is modified in
            place by insert_index.
        """
        self._indices = indices

    def __repr__(self):
        return "%s(%s)" % (
                self.__class__.__name__,
                ', '.join(map(repr, self._indices)))

    def insert_index(self, pos, index):
        """Insert a new index in the list of indices to query.

        :param pos: The position to insert the index.
        :param index: The index to insert.
        """
        self._indices.insert(pos, index)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once; the entry from the earliest
        child index in the list wins.

        :return: An iterable of the nodes produced by the child indices,
            i.e. (index, key, value, reference_lists), or (index, key,
            value) for children without reference lists. There is no
            defined order for the result iteration - it will be in the
            most efficient order for the index.
        """
        seen_keys = set()
        for index in self._indices:
            for node in index.iter_all_entries():
                # node[1] is the key of the entry.
                if node[1] not in seen_keys:
                    yield node
                    seen_keys.add(node[1])

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of the nodes produced by the child indices,
            i.e. (index, key, value, reference_lists), or (index, key,
            value) for children without reference lists. There is no
            defined order for the result iteration - it will be in the
            most efficient order for the index.
        """
        keys = set(keys)
        for index in self._indices:
            if not keys:
                # Everything asked for has been found already.
                return
            # Give the child its own snapshot of the outstanding keys: the
            # working set is shrunk while the child's iterator is still
            # live, and a child that walks its argument lazily would
            # otherwise fail with "Set changed size during iteration".
            for node in index.iter_entries(set(keys)):
                keys.remove(node[1])
                yield node

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        keys = set(keys)
        if not keys:
            return
        seen_keys = set()
        for index in self._indices:
            for node in index.iter_entries_prefix(keys):
                if node[1] in seen_keys:
                    continue
                seen_keys.add(node[1])
                yield node

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For CombinedGraphIndex this is approximated by the sum of the keys of
        the child indices. As child indices may have duplicate keys this can
        have a maximum error of the number of child indices * largest number of
        keys in any index.
        """
        return sum((index.key_count() for index in self._indices), 0)

    def validate(self):
        """Validate that everything in the index can be accessed."""
        for index in self._indices:
            index.validate()

1035

1036

1037

class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during a
    single write operation, where the accumulated entries need to be immediately
    available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add
            when this index has reference lists, otherwise an iterable of
            (key, value) entries.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when the index has no reference lists.
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (in this case
            dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        # self._nodes maps key -> (absent, references, value); entries
        # flagged absent are never reported.
        if self.reference_lists:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value, references
        else:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when the index has no reference lists.
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (keys iteration order
            in this case).
        """
        keys = set(keys)
        if self.reference_lists:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                # node is (absent, references, value).
                if not node[0]:
                    yield self, key, node[2], node[1]
        else:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        :raises errors.BadIndexKey: If a prefix starts with None or does not
            have the key length of this index.
        """
        # XXX: Too much duplication with the GraphIndex class; consider
        # finding a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        if self._key_length == 1:
            # With one-element keys a prefix is a complete key, so this is
            # a plain lookup.
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                try:
                    node = self._nodes[key]
                except KeyError:
                    # a non-existent lookup matches nothing, exactly as in
                    # the multi-element case below.
                    continue
                if node[0]:
                    # absent entry, not reported.
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
            return
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = self._nodes_by_key
            elements = list(key)
            # find the subdict to return: descend one level per leading
            # non-None element of the prefix.
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                # Trailing None elements remain: report every entry found
                # below this point of the nested dicts.
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist, so peeking at one
                    # value tells whether this level holds further dicts or
                    # the entries themselves.
                    sample = key_dict.itervalues().next()
                    if isinstance(sample, dict):
                        # push keys
                        dicts.extend(key_dict.itervalues())
                    else:
                        # yield keys
                        for entry in key_dict.itervalues():
                            yield (self, ) + entry
            else:
                # The prefix was a complete key, so key_dict is now the
                # stored entry tuple itself.
                yield (self, ) + key_dict

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory index's have no known corruption at the moment."""

1175

1176

1177

class GraphIndexPrefixAdapter(object):

1178

"""An adapter between GraphIndex with different key lengths.

1179

1180

Queries against this will emit queries against the adapted Graph with the

1181

prefix added, queries for all items use iter_entries_prefix. The returned

1182

nodes will have their keys and node references adjusted to remove the

1183

prefix. Finally, an add_nodes_callback can be supplied - when called the

1184

nodes and references being added will have prefix prepended.

1185

"""

1186

1187

def __init__(self, adapted, prefix, missing_key_length,

1188

add_nodes_callback=None):

1189

"""Construct an adapter against adapted with prefix."""

1190

self.adapted = adapted

1191

self.prefix_key = prefix + (None,)*missing_key_length

1192

self.prefix = prefix

1193

self.prefix_len = len(prefix)

1194

self.add_nodes_callback = add_nodes_callback

1195

1196

def add_nodes(self, nodes):

1197

"""Add nodes to the index.

1198

1199

:param nodes: An iterable of (key, node_refs, value) entries to add.

1200

"""

1201

# save nodes in case its an iterator

1202

nodes = tuple(nodes)

1203

translated_nodes = []

1204

try:

1205

# Add prefix_key to each reference node_refs is a tuple of tuples,

1206

# so split it apart, and add prefix_key to the internal reference

1207

for (key, value, node_refs) in nodes:

1208

adjusted_references = (

1209

tuple(tuple(self.prefix + ref_node for ref_node in ref_list)

1210

for ref_list in node_refs))

1211

translated_nodes.append((self.prefix + key, value,

1212

adjusted_references))

1213

except ValueError:

1214

# XXX: TODO add an explicit interface for getting the reference list

1215

# status, to handle this bit of user-friendliness in the API more

1216

# explicitly.

1217

for (key, value) in nodes:

1218

translated_nodes.append((self.prefix + key, value))

1219

self.add_nodes_callback(translated_nodes)

1220

1221

def add_node(self, key, value, references=()):

1222

"""Add a node to the index.

1223

1224

:param key: The key. keys are non-empty tuples containing

1225

as many whitespace-free utf8 bytestrings as the key length

1226

defined for this index.

1227

:param references: An iterable of iterables of keys. Each is a

1228

reference to another key.

1229

:param value: The value to associate with the key. It may be any

1230

bytes as long as it does not contain \0 or \n.

1231

"""

1232

self.add_nodes(((key, value, references), ))

1233

1234

def _strip_prefix(self, an_iter):

1235

"""Strip prefix data from nodes and return it."""

1236

for node in an_iter:

1237

# cross checks

1238

if node[1][:self.prefix_len] != self.prefix:

1239

raise errors.BadIndexData(self)

1240

for ref_list in node[3]:

1241

for ref_node in ref_list:

1242

if ref_node[:self.prefix_len] != self.prefix:

1243

raise errors.BadIndexData(self)

1244

yield node[0], node[1][self.prefix_len:], node[2], (

1245

tuple(tuple(ref_node[self.prefix_len:] for ref_node in ref_list)

1246

for ref_list in node[3]))

1247

1248

def iter_all_entries(self):

1249

"""Iterate over all keys within the index

1250

1251

iter_all_entries is implemented against the adapted index using

1252

iter_entries_prefix.

1253

1254

:return: An iterable of (index, key, reference_lists, value). There is no

1255

defined order for the result iteration - it will be in the most

1256

efficient order for the index (in this case dictionary hash order).

1257

"""

1258

return self._strip_prefix(self.adapted.iter_entries_prefix([self.prefix_key]))

1259

1260

def iter_entries(self, keys):

1261

"""Iterate over keys within the index.

1262

1263

:param keys: An iterable providing the keys to be retrieved.

1264

:return: An iterable of (key, reference_lists, value). There is no

1265

defined order for the result iteration - it will be in the most

1266

efficient order for the index (keys iteration order in this case).

1267

"""

1268

return self._strip_prefix(self.adapted.iter_entries(

1269

self.prefix + key for key in keys))

1270

1271

def iter_entries_prefix(self, keys):

1272

"""Iterate over keys within the index using prefix matching.

1273

1274

Prefix matching is applied within the tuple of a key, not to within

1275

the bytestring of each key element. e.g. if you have the keys ('foo',

1276

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1277

only the former key is returned.

1278

1279

:param keys: An iterable providing the key prefixes to be retrieved.

1280

Each key prefix takes the form of a tuple the length of a key, but

1281

with the last N elements 'None' rather than a regular bytestring.

1282

The first element cannot be 'None'.

1283

:return: An iterable as per iter_all_entries, but restricted to the

1284

keys with a matching prefix to those supplied. No additional keys

1285

will be returned, and every match that is in the index will be

1286

returned.

1287

"""

1288

return self._strip_prefix(self.adapted.iter_entries_prefix(

1289

self.prefix + key for key in keys))

1290

1291

def key_count(self):

1292

"""Return an estimate of the number of keys in this index.

1293

1294

For GraphIndexPrefixAdapter this is relatively expensive - key

1295

iteration with the prefix is done.

1296

"""

1297

return len(list(self.iter_all_entries()))

1298

1299

def validate(self):

1300

"""Call the adapted's validate."""

1301

self.adapted.validate()

Older »