/brz/remove-bazaar : revision 2743.1.4

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Robert Collins
Date: 2007-08-22 22:32:23 UTC
mto: This revision was merged to the branch mainline in revision 2744.
Revision ID: robertc@robertcollins.net-20070822223223-0heetwybcuonp00g

Fix an off-by-one in check.py that leads to the progress bar showing
complete for a phase but not actually being complete; if the last file id
checked is big this is confusing. (Robert Collins)

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics.py

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/multiparent.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/HttpServer.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/last-modified.txt

doc/developers/merge-scaling.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/profiling.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/uncommit.txt

doc/en

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/user-guide

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/centralized_workflow.txt

doc/en/user-guide/configuration.txt

doc/en/user-guide/conflicts.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/index.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/tutorial.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/version_info.txt

doc/en/user-reference

doc/index.txt

generate_docs.py

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

tools/win32/survey.txt

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from cStringIO import StringIO

import re

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib.trace import mutter

""")

from bzrlib import debug, errors

_OPTION_KEY_ELEMENTS = "key_elements="

_OPTION_LEN = "len="

_OPTION_NODE_REFS = "node_ref_lists="

_SIGNATURE = "Bazaar Graph Index 1\n"

_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

_newline_null_re = re.compile('[\n\0]')

class GraphIndexBuilder(object):

"""A builder that can build a GraphIndex.

The resulting graph has the structure:

_SIGNATURE OPTIONS NODES NEWLINE

_SIGNATURE := 'Bazaar Graph Index 1' NEWLINE

OPTIONS := 'node_ref_lists=' DIGITS NEWLINE

NODES := NODE*

NODE := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

KEY := Not-whitespace-utf8

ABSENT := 'a'

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

REFERENCE := DIGITS ; digits is the byte offset in the index of the

; referenced key.

VALUE := no-newline-no-null-bytes

"""

def __init__(self, reference_lists=0, key_elements=1):

"""Create a GraphIndex builder.

:param reference_lists: The number of node references lists for each

entry.

:param key_elements: The number of bytestrings in each key.

"""

self.reference_lists = reference_lists

self._keys = set()

self._nodes = {}

self._nodes_by_key = {}

self._key_length = key_elements

def _check_key(self, key):

"""Raise BadIndexKey if key is not a valid key for this index."""

if type(key) != tuple:

raise errors.BadIndexKey(key)

if self._key_length != len(key):

raise errors.BadIndexKey(key)

for element in key:

if not element or _whitespace_re.search(element) is not None:

raise errors.BadIndexKey(element)

def add_node(self, key, value, references=()):

"""Add a node to the index.

:param key: The key. keys are non-empty tuples containing

as many whitespace-free utf8 bytestrings as the key length

defined for this index.

:param references: An iterable of iterables of keys. Each is a

reference to another key.

:param value: The value to associate with the key. It may be any

bytes as long as it does not contain \0 or \n.

"""

self._check_key(key)

100

if _newline_null_re.search(value) is not None:

101

raise errors.BadIndexValue(value)

102

if len(references) != self.reference_lists:

103

raise errors.BadIndexValue(references)

104

node_refs = []

105

for reference_list in references:

106

for reference in reference_list:

107

self._check_key(reference)

108

if reference not in self._nodes:

109

self._nodes[reference] = ('a', (), '')

110

node_refs.append(tuple(reference_list))

111

if key in self._nodes and self._nodes[key][0] == '':

112

raise errors.BadIndexDuplicateKey(key, self)

113

self._nodes[key] = ('', tuple(node_refs), value)

114

self._keys.add(key)

115

if self._key_length > 1:

116

key_dict = self._nodes_by_key

117

if self.reference_lists:

118

key_value = key, value, tuple(node_refs)

119

else:

120

key_value = key, value

121

# possibly should do this on-demand, but it seems likely it is

122

# always wanted

123

# For a key of (foo, bar, baz) create

124

# _nodes_by_key[foo][bar][baz] = key_value

125

for subkey in key[:-1]:

126

key_dict = key_dict.setdefault(subkey, {})

127

key_dict[key[-1]] = key_value

128

129

def finish(self):

130

lines = [_SIGNATURE]

131

lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')

132

lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')

133

lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')

134

prefix_length = sum(len(x) for x in lines)

135

# references are byte offsets. To avoid having to do nasty

136

# polynomial work to resolve offsets (references to later in the

137

# file cannot be determined until all the inbetween references have

138

# been calculated too) we pad the offsets with 0's to make them be

139

# of consistent length. Using binary offsets would break the trivial

140

# file parsing.

141

# to calculate the width of zero's needed we do three passes:

142

# one to gather all the non-reference data and the number of references.

143

# one to pad all the data with reference-length and determine entry

144

# addresses.

145

# One to serialise.

146

147

# forward sorted by key. In future we may consider topological sorting,

148

# at the cost of table scans for direct lookup, or a second index for

149

# direct lookup

150

nodes = sorted(self._nodes.items())

151

# if we do not prepass, we don't know how long it will be up front.

152

expected_bytes = None

153

# we only need to pre-pass if we have reference lists at all.

154

if self.reference_lists:

155

key_offset_info = []

156

non_ref_bytes = prefix_length

157

total_references = 0

158

# TODO use simple multiplication for the constants in this loop.

159

for key, (absent, references, value) in nodes:

160

# record the offset known *so far* for this key:

161

# the non reference bytes to date, and the total references to

162

# date - saves reaccumulating on the second pass

163

key_offset_info.append((key, non_ref_bytes, total_references))

164

# key is literal, value is literal, there are 3 null's, 1 NL

165

# key is variable length tuple, \x00 between elements

166

non_ref_bytes += sum(len(element) for element in key)

167

if self._key_length > 1:

168

non_ref_bytes += self._key_length - 1

169

# value is literal bytes, there are 3 null's, 1 NL.

170

non_ref_bytes += len(value) + 3 + 1

171

# one byte for absent if set.

172

if absent:

173

non_ref_bytes += 1

174

elif self.reference_lists:

175

# (ref_lists -1) tabs

176

non_ref_bytes += self.reference_lists - 1

177

# (ref-1 cr's per ref_list)

178

for ref_list in references:

179

# how many references across the whole file?

180

total_references += len(ref_list)

181

# accrue reference separators

182

if ref_list:

183

non_ref_bytes += len(ref_list) - 1

184

# how many digits are needed to represent the total byte count?

185

digits = 1

186

possible_total_bytes = non_ref_bytes + total_references*digits

187

while 10 ** digits < possible_total_bytes:

188

digits += 1

189

possible_total_bytes = non_ref_bytes + total_references*digits

190

expected_bytes = possible_total_bytes + 1 # terminating newline

191

# resolve key addresses.

192

key_addresses = {}

193

for key, non_ref_bytes, total_references in key_offset_info:

194

key_addresses[key] = non_ref_bytes + total_references*digits

195

# serialise

196

format_string = '%%0%sd' % digits

197

for key, (absent, references, value) in nodes:

198

flattened_references = []

199

for ref_list in references:

200

ref_addresses = []

201

for reference in ref_list:

202

ref_addresses.append(format_string % key_addresses[reference])

203

flattened_references.append('\r'.join(ref_addresses))

204

string_key = '\x00'.join(key)

205

lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,

206

'\t'.join(flattened_references), value))

207

lines.append('\n')

208

result = StringIO(''.join(lines))

209

if expected_bytes and len(result.getvalue()) != expected_bytes:

210

raise errors.BzrError('Failed index creation. Internal error:'

211

' mismatched output length and expected length: %d %d' %

212

(len(result.getvalue()), expected_bytes))

213

return StringIO(''.join(lines))

214

215

216

class GraphIndex(object):

217

"""An index for data with embedded graphs.

218

219

The index maps keys to a list of key reference lists, and a value.

220

Each node has the same number of key reference lists. Each key reference

221

list can be empty or an arbitrary length. The value is an opaque NULL

222

terminated string without any newlines. The storage of the index is

223

hidden in the interface: keys and key references are always tuples of

224

bytestrings, never the internal representation (e.g. dictionary offsets).

225

226

It is presumed that the index will not be mutated - it is static data.

227

228

Successive iter_all_entries calls will read the entire index each time.

229

Additionally, iter_entries calls will read the index linearly until the

230

desired keys are found. XXX: This must be fixed before the index is

231

suitable for production use. :XXX

232

"""

233

234

def __init__(self, transport, name):

235

"""Open an index called name on transport.

236

237

:param transport: A bzrlib.transport.Transport.

238

:param name: A path to provide to transport API calls.

239

"""

240

self._transport = transport

241

self._name = name

242

self._nodes = None

243

self._key_count = None

244

self._keys_by_offset = None

245

self._nodes_by_key = None

246

247

def _buffer_all(self):

248

"""Buffer all the index data.

249

250

Mutates self._nodes and self.keys_by_offset.

251

"""

252

if 'index' in debug.debug_flags:

253

mutter('Reading entire index %s', self._transport.abspath(self._name))

254

stream = self._transport.get(self._name)

255

self._read_prefix(stream)

256

expected_elements = 3 + self._key_length

257

line_count = 0

258

# raw data keyed by offset

259

self._keys_by_offset = {}

260

# ready-to-return key:value or key:value, node_ref_lists

261

self._nodes = {}

262

self._nodes_by_key = {}

263

trailers = 0

264

pos = stream.tell()

265

for line in stream.readlines():

266

if line == '\n':

267

trailers += 1

268

continue

269

elements = line.split('\0')

270

if len(elements) != expected_elements:

271

raise errors.BadIndexData(self)

272

# keys are tuples

273

key = tuple(elements[:self._key_length])

274

absent, references, value = elements[-3:]

275

value = value[:-1] # remove the newline

276

ref_lists = []

277

for ref_string in references.split('\t'):

278

ref_lists.append(tuple([

279

int(ref) for ref in ref_string.split('\r') if ref

280

]))

281

ref_lists = tuple(ref_lists)

282

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

283

pos += len(line)

284

for key, absent, references, value in self._keys_by_offset.itervalues():

285

if absent:

286

continue

287

# resolve references:

288

if self.node_ref_lists:

289

node_refs = []

290

for ref_list in references:

291

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

292

node_value = (value, tuple(node_refs))

293

else:

294

node_value = value

295

self._nodes[key] = node_value

296

if self._key_length > 1:

297

subkey = list(reversed(key[:-1]))

298

key_dict = self._nodes_by_key

299

if self.node_ref_lists:

300

key_value = key, node_value[0], node_value[1]

301

else:

302

key_value = key, node_value

303

# possibly should do this on-demand, but it seems likely it is

304

# always wanted

305

# For a key of (foo, bar, baz) create

306

# _nodes_by_key[foo][bar][baz] = key_value

307

for subkey in key[:-1]:

308

key_dict = key_dict.setdefault(subkey, {})

309

key_dict[key[-1]] = key_value

310

# cache the keys for quick set intersections

311

self._keys = set(self._nodes)

312

if trailers != 1:

313

# there must be one line - the empty trailer line.

314

raise errors.BadIndexData(self)

315

316

def iter_all_entries(self):

317

"""Iterate over all keys within the index.

318

319

:return: An iterable of (key, value) or (key, value, reference_lists).

320

The former tuple is used when there are no reference lists in the

321

index, making the API compatible with simple key:value index types.

322

There is no defined order for the result iteration - it will be in

323

the most efficient order for the index.

324

"""

325

if self._nodes is None:

326

self._buffer_all()

327

if self.node_ref_lists:

328

for key, (value, node_ref_lists) in self._nodes.iteritems():

329

yield self, key, value, node_ref_lists

330

else:

331

for key, value in self._nodes.iteritems():

332

yield self, key, value

333

334

def _read_prefix(self, stream):

335

signature = stream.read(len(self._signature()))

336

if not signature == self._signature():

337

raise errors.BadIndexFormatSignature(self._name, GraphIndex)

338

options_line = stream.readline()

339

if not options_line.startswith(_OPTION_NODE_REFS):

340

raise errors.BadIndexOptions(self)

341

try:

342

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):-1])

343

except ValueError:

344

raise errors.BadIndexOptions(self)

345

options_line = stream.readline()

346

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

347

raise errors.BadIndexOptions(self)

348

try:

349

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):-1])

350

except ValueError:

351

raise errors.BadIndexOptions(self)

352

options_line = stream.readline()

353

if not options_line.startswith(_OPTION_LEN):

354

raise errors.BadIndexOptions(self)

355

try:

356

self._key_count = int(options_line[len(_OPTION_LEN):-1])

357

except ValueError:

358

raise errors.BadIndexOptions(self)

359

360

def iter_entries(self, keys):

361

"""Iterate over keys within the index.

362

363

:param keys: An iterable providing the keys to be retrieved.

364

:return: An iterable as per iter_all_entries, but restricted to the

365

keys supplied. No additional keys will be returned, and every

366

key supplied that is in the index will be returned.

367

"""

368

keys = set(keys)

369

if not keys:

370

return

371

if self._nodes is None:

372

self._buffer_all()

373

keys = keys.intersection(self._keys)

374

if self.node_ref_lists:

375

for key in keys:

376

value, node_refs = self._nodes[key]

377

yield self, key, value, node_refs

378

else:

379

for key in keys:

380

yield self, key, self._nodes[key]

381

382

def iter_entries_prefix(self, keys):

383

"""Iterate over keys within the index using prefix matching.

384

385

Prefix matching is applied within the tuple of a key, not to within

386

the bytestring of each key element. e.g. if you have the keys ('foo',

387

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

388

only the former key is returned.

389

390

:param keys: An iterable providing the key prefixes to be retrieved.

391

Each key prefix takes the form of a tuple the length of a key, but

392

with the last N elements 'None' rather than a regular bytestring.

393

The first element cannot be 'None'.

394

:return: An iterable as per iter_all_entries, but restricted to the

395

keys with a matching prefix to those supplied. No additional keys

396

will be returned, and every match that is in the index will be

397

returned.

398

"""

399

keys = set(keys)

400

if not keys:

401

return

402

# load data - also finds key lengths

403

if self._nodes is None:

404

self._buffer_all()

405

if self._key_length == 1:

406

for key in keys:

407

# sanity check

408

if key[0] is None:

409

raise errors.BadIndexKey(key)

410

if len(key) != self._key_length:

411

raise errors.BadIndexKey(key)

412

if self.node_ref_lists:

413

value, node_refs = self._nodes[key]

414

yield self, key, value, node_refs

415

else:

416

yield self, key, self._nodes[key]

417

return

418

for key in keys:

419

# sanity check

420

if key[0] is None:

421

raise errors.BadIndexKey(key)

422

if len(key) != self._key_length:

423

raise errors.BadIndexKey(key)

424

# find what it refers to:

425

key_dict = self._nodes_by_key

426

elements = list(key)

427

# find the subdict whose contents should be returned.

428

try:

429

while len(elements) and elements[0] is not None:

430

key_dict = key_dict[elements[0]]

431

elements.pop(0)

432

except KeyError:

433

# a non-existant lookup.

434

continue

435

if len(elements):

436

dicts = [key_dict]

437

while dicts:

438

key_dict = dicts.pop(-1)

439

# can't be empty or would not exist

440

item, value = key_dict.iteritems().next()

441

if type(value) == dict:

442

# push keys

443

dicts.extend(key_dict.itervalues())

444

else:

445

# yield keys

446

for value in key_dict.itervalues():

447

# each value is the key:value:node refs tuple

448

# ready to yield.

449

yield (self, ) + value

450

else:

451

# the last thing looked up was a terminal element

452

yield (self, ) + key_dict

453

454

def key_count(self):

455

"""Return an estimate of the number of keys in this index.

456

457

For GraphIndex the estimate is exact.

458

"""

459

if self._key_count is None:

460

# really this should just read the prefix

461

self._buffer_all()

462

return self._key_count

463

464

def _signature(self):

465

"""The file signature for this index type."""

466

return _SIGNATURE

467

468

def validate(self):

469

"""Validate that everything in the index can be accessed."""

470

# iter_all validates completely at the moment, so just do that.

471

for node in self.iter_all_entries():

472

pass

473

474

475

class CombinedGraphIndex(object):

476

"""A GraphIndex made up from smaller GraphIndices.

477

478

The backing indices must implement GraphIndex, and are presumed to be

479

static data.

480

481

Queries against the combined index will be made against the first index,

482

and then the second and so on. The order of index's can thus influence

483

performance significantly. For example, if one index is on local disk and a

484

second on a remote server, the local disk index should be before the other

485

in the index list.

486

"""

487

488

def __init__(self, indices):

489

"""Create a CombinedGraphIndex backed by indices.

490

491

:param indices: An ordered list of indices to query for data.

492

"""

493

self._indices = indices

494

495

def insert_index(self, pos, index):

496

"""Insert a new index in the list of indices to query.

497

498

:param pos: The position to insert the index.

499

:param index: The index to insert.

500

"""

501

self._indices.insert(pos, index)

502

503

def iter_all_entries(self):

504

"""Iterate over all keys within the index

505

506

Duplicate keys across child indices are presumed to have the same

507

value and are only reported once.

508

509

:return: An iterable of (key, reference_lists, value). There is no

510

defined order for the result iteration - it will be in the most

511

efficient order for the index.

512

"""

513

seen_keys = set()

514

for index in self._indices:

515

for node in index.iter_all_entries():

516

if node[1] not in seen_keys:

517

yield node

518

seen_keys.add(node[1])

519

520

def iter_entries(self, keys):

521

"""Iterate over keys within the index.

522

523

Duplicate keys across child indices are presumed to have the same

524

value and are only reported once.

525

526

:param keys: An iterable providing the keys to be retrieved.

527

:return: An iterable of (key, reference_lists, value). There is no

528

defined order for the result iteration - it will be in the most

529

efficient order for the index.

530

"""

531

keys = set(keys)

532

for index in self._indices:

533

if not keys:

534

return

535

for node in index.iter_entries(keys):

536

keys.remove(node[1])

537

yield node

538

539

def iter_entries_prefix(self, keys):

540

"""Iterate over keys within the index using prefix matching.

541

542

Duplicate keys across child indices are presumed to have the same

543

value and are only reported once.

544

545

Prefix matching is applied within the tuple of a key, not to within

546

the bytestring of each key element. e.g. if you have the keys ('foo',

547

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

548

only the former key is returned.

549

550

:param keys: An iterable providing the key prefixes to be retrieved.

551

Each key prefix takes the form of a tuple the length of a key, but

552

with the last N elements 'None' rather than a regular bytestring.

553

The first element cannot be 'None'.

554

:return: An iterable as per iter_all_entries, but restricted to the

555

keys with a matching prefix to those supplied. No additional keys

556

will be returned, and every match that is in the index will be

557

returned.

558

"""

559

keys = set(keys)

560

if not keys:

561

return

562

seen_keys = set()

563

for index in self._indices:

564

for node in index.iter_entries_prefix(keys):

565

if node[1] in seen_keys:

566

continue

567

seen_keys.add(node[1])

568

yield node

569

570

def key_count(self):

571

"""Return an estimate of the number of keys in this index.

572

573

For CombinedGraphIndex this is approximated by the sum of the keys of

574

the child indices. As child indices may have duplicate keys this can

575

have a maximum error of the number of child indices * largest number of

576

keys in any index.

577

"""

578

return sum((index.key_count() for index in self._indices), 0)

579

580

def validate(self):

581

"""Validate that everything in the index can be accessed."""

582

for index in self._indices:

583

index.validate()

584

585

586

class InMemoryGraphIndex(GraphIndexBuilder):

587

"""A GraphIndex which operates entirely out of memory and is mutable.

588

589

This is designed to allow the accumulation of GraphIndex entries during a

590

single write operation, where the accumulated entries need to be immediately

591

available - for example via a CombinedGraphIndex.

592

"""

593

594

def add_nodes(self, nodes):

595

"""Add nodes to the index.

596

597

:param nodes: An iterable of (key, node_refs, value) entries to add.

598

"""

599

if self.reference_lists:

600

for (key, value, node_refs) in nodes:

601

self.add_node(key, value, node_refs)

602

else:

603

for (key, value) in nodes:

604

self.add_node(key, value)

605

606

def iter_all_entries(self):

607

"""Iterate over all keys within the index

608

609

:return: An iterable of (key, reference_lists, value). There is no

610

defined order for the result iteration - it will be in the most

611

efficient order for the index (in this case dictionary hash order).

612

"""

613

if self.reference_lists:

614

for key, (absent, references, value) in self._nodes.iteritems():

615

if not absent:

616

yield self, key, value, references

617

else:

618

for key, (absent, references, value) in self._nodes.iteritems():

619

if not absent:

620

yield self, key, value

621

622

def iter_entries(self, keys):

623

"""Iterate over keys within the index.

624

625

:param keys: An iterable providing the keys to be retrieved.

626

:return: An iterable of (key, reference_lists, value). There is no

627

defined order for the result iteration - it will be in the most

628

efficient order for the index (keys iteration order in this case).

629

"""

630

keys = set(keys)

631

if self.reference_lists:

632

for key in keys.intersection(self._keys):

633

node = self._nodes[key]

634

if not node[0]:

635

yield self, key, node[2], node[1]

636

else:

637

for key in keys.intersection(self._keys):

638

node = self._nodes[key]

639

if not node[0]:

640

yield self, key, node[2]

641

642

def iter_entries_prefix(self, keys):

643

"""Iterate over keys within the index using prefix matching.

644

645

Prefix matching is applied within the tuple of a key, not to within

646

the bytestring of each key element. e.g. if you have the keys ('foo',

647

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

648

only the former key is returned.

649

650

:param keys: An iterable providing the key prefixes to be retrieved.

651

Each key prefix takes the form of a tuple the length of a key, but

652

with the last N elements 'None' rather than a regular bytestring.

653

The first element cannot be 'None'.

654

:return: An iterable as per iter_all_entries, but restricted to the

655

keys with a matching prefix to those supplied. No additional keys

656

will be returned, and every match that is in the index will be

657

returned.

658

"""

659

# XXX: To much duplication with the GraphIndex class; consider finding

660

# a good place to pull out the actual common logic.

661

keys = set(keys)

662

if not keys:

663

return

664

if self._key_length == 1:

665

for key in keys:

666

# sanity check

667

if key[0] is None:

668

raise errors.BadIndexKey(key)

669

if len(key) != self._key_length:

670

raise errors.BadIndexKey(key)

671

node = self._nodes[key]

672

if node[0]:

673

continue

674

if self.reference_lists:

675

yield self, key, node[2], node[1]

676

else:

677

yield self, key, node[2]

678

return

679

for key in keys:

680

# sanity check

681

if key[0] is None:

682

raise errors.BadIndexKey(key)

683

if len(key) != self._key_length:

684

raise errors.BadIndexKey(key)

685

# find what it refers to:

686

key_dict = self._nodes_by_key

687

elements = list(key)

688

# find the subdict to return

689

try:

690

while len(elements) and elements[0] is not None:

691

key_dict = key_dict[elements[0]]

692

elements.pop(0)

693

except KeyError:

694

# a non-existant lookup.

695

continue

696

if len(elements):

697

dicts = [key_dict]

698

while dicts:

699

key_dict = dicts.pop(-1)

700

# can't be empty or would not exist

701

item, value = key_dict.iteritems().next()

702

if type(value) == dict:

703

# push keys

704

dicts.extend(key_dict.itervalues())

705

else:

706

# yield keys

707

for value in key_dict.itervalues():

708

yield (self, ) + value

709

else:

710

yield (self, ) + key_dict

711

712

def key_count(self):

713

"""Return an estimate of the number of keys in this index.

714

715

For InMemoryGraphIndex the estimate is exact.

716

"""

717

return len(self._keys)

718

719

def validate(self):

720

"""In memory index's have no known corruption at the moment."""

721

722

723

class GraphIndexPrefixAdapter(object):

724

"""An adapter between GraphIndex with different key lengths.

725

726

Queries against this will emit queries against the adapted Graph with the

727

prefix added, queries for all items use iter_entries_prefix. The returned

728

nodes will have their keys and node references adjusted to remove the

729

prefix. Finally, an add_nodes_callback can be supplied - when called the

730

nodes and references being added will have prefix prepended.

731

"""

732

733

def __init__(self, adapted, prefix, missing_key_length,

734

add_nodes_callback=None):

735

"""Construct an adapter against adapted with prefix."""

736

self.adapted = adapted

737

self.prefix_key = prefix + (None,)*missing_key_length

738

self.prefix = prefix

739

self.prefix_len = len(prefix)

740

self.add_nodes_callback = add_nodes_callback

741

742

def add_nodes(self, nodes):

743

"""Add nodes to the index.

744

745

:param nodes: An iterable of (key, node_refs, value) entries to add.

746

"""

747

# save nodes in case its an iterator

748

nodes = tuple(nodes)

749

translated_nodes = []

750

try:

751

# Add prefix_key to each reference node_refs is a tuple of tuples,

752

# so split it apart, and add prefix_key to the internal reference

753

for (key, value, node_refs) in nodes:

754

adjusted_references = (

755

tuple(tuple(self.prefix + ref_node for ref_node in ref_list)

756

for ref_list in node_refs))

757

translated_nodes.append((self.prefix + key, value,

758

adjusted_references))

759

except ValueError:

760

# XXX: TODO add an explicit interface for getting the reference list

761

# status, to handle this bit of user-friendliness in the API more

762

# explicitly.

763

for (key, value) in nodes:

764

translated_nodes.append((self.prefix + key, value))

765

self.add_nodes_callback(translated_nodes)

766

767

def add_node(self, key, value, references=()):

768

"""Add a node to the index.

769

770

:param key: The key. keys are non-empty tuples containing

771

as many whitespace-free utf8 bytestrings as the key length

772

defined for this index.

773

:param references: An iterable of iterables of keys. Each is a

774

reference to another key.

775

:param value: The value to associate with the key. It may be any

776

bytes as long as it does not contain \0 or \n.

777

"""

778

self.add_nodes(((key, value, references), ))

779

780

def _strip_prefix(self, an_iter):

781

"""Strip prefix data from nodes and return it."""

782

for node in an_iter:

783

# cross checks

784

if node[1][:self.prefix_len] != self.prefix:

785

raise errors.BadIndexData(self)

786

for ref_list in node[3]:

787

for ref_node in ref_list:

788

if ref_node[:self.prefix_len] != self.prefix:

789

raise errors.BadIndexData(self)

790

yield node[0], node[1][self.prefix_len:], node[2], (

791

tuple(tuple(ref_node[self.prefix_len:] for ref_node in ref_list)

792

for ref_list in node[3]))

793

794

def iter_all_entries(self):

795

"""Iterate over all keys within the index

796

797

iter_all_entries is implemented against the adapted index using

798

iter_entries_prefix.

799

800

:return: An iterable of (key, reference_lists, value). There is no

801

defined order for the result iteration - it will be in the most

802

efficient order for the index (in this case dictionary hash order).

803

"""

804

return self._strip_prefix(self.adapted.iter_entries_prefix([self.prefix_key]))

805

806

def iter_entries(self, keys):

807

"""Iterate over keys within the index.

808

809

:param keys: An iterable providing the keys to be retrieved.

810

:return: An iterable of (key, reference_lists, value). There is no

811

defined order for the result iteration - it will be in the most

812

efficient order for the index (keys iteration order in this case).

813

"""

814

return self._strip_prefix(self.adapted.iter_entries(

815

self.prefix + key for key in keys))

816

817

def iter_entries_prefix(self, keys):

818

"""Iterate over keys within the index using prefix matching.

819

820

Prefix matching is applied within the tuple of a key, not to within

821

the bytestring of each key element. e.g. if you have the keys ('foo',

822

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

823

only the former key is returned.

824

825

:param keys: An iterable providing the key prefixes to be retrieved.

826

Each key prefix takes the form of a tuple the length of a key, but

827

with the last N elements 'None' rather than a regular bytestring.

828

The first element cannot be 'None'.

829

:return: An iterable as per iter_all_entries, but restricted to the

830

keys with a matching prefix to those supplied. No additional keys

831

will be returned, and every match that is in the index will be

832

returned.

833

"""

834

return self._strip_prefix(self.adapted.iter_entries_prefix(

835

self.prefix + key for key in keys))

836

837

def key_count(self):

838

"""Return an estimate of the number of keys in this index.

839

840

For GraphIndexPrefixAdapter this is relatively expensive - key

841

iteration with the prefix is done.

842

"""

843

return len(list(self.iter_all_entries()))

844

845

def validate(self):

846

"""Call the adapted's validate."""

847

self.adapted.validate()

Older »