/brz/remove-bazaar : revision 3644.2.10

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: John Arbash Meinel
Date: 2008-08-28 20:13:31 UTC
mfrom: (3658 +trunk)
mto: This revision was merged to the branch mainline in revision 3688.
Revision ID: john@arbash-meinel.com-20080828201331-dqffxf54l2heokll

Merge bzr.dev 3658

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_btree_serializer_c.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_walkdirs_win32.h

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chunk_writer.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/helpers.py

bzrlib/tests/repository_implementations/test__generate_text_key_index.py

bzrlib/tests/repository_implementations/test_add_fallback_repository.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_find_text_key_references.py

bzrlib/tests/repository_implementations/test_get_parent_map.py

bzrlib/tests/repository_implementations/test_has_revisions.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_is_write_locked.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/developer-guide/testing.txt

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/index.txt

generate_docs.py

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/package_mf.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

commands.py

converter.py

dir.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

notes

notes/roundtripping.txt

remote.py

repository.py

revspec.py

server.py

setup.py

shamap.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_fetch.py

tests/test_ids.py

tests/test_repository.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

# Names exported by ``from bzrlib.index import *``.
__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

symbol_versioning,

)

# (offset, length) readv range requested when only the index header is needed.
_HEADER_READV = (0, 200)

# Prefixes of the option lines that follow the signature line.
_OPTION_KEY_ELEMENTS = "key_elements="

_OPTION_LEN = "len="

_OPTION_NODE_REFS = "node_ref_lists="

# First line of every serialised index.
_SIGNATURE = "Bazaar Graph Index 1\n"

# Matches any character that may not appear inside a key element.
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

# Matches the characters that may not appear inside a node value.
_newline_null_re = re.compile('[\n\0]')

class GraphIndexBuilder(object):
    """A builder that can build a GraphIndex.

    The resulting graph has the structure:

    _SIGNATURE OPTIONS NODES NEWLINE
    _SIGNATURE     := 'Bazaar Graph Index 1' NEWLINE
    OPTIONS        := 'node_ref_lists=' DIGITS NEWLINE
                      'key_elements=' DIGITS NEWLINE
                      'len=' DIGITS NEWLINE
    NODES          := NODE*
    NODE           := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE
    KEY            := Not-whitespace-utf8 (NULL Not-whitespace-utf8)*
    ABSENT         := 'a'
    REFERENCES     := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}
    REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?
    REFERENCE      := DIGITS  ; digits is the byte offset in the index of the
                              ; referenced key.
    VALUE          := no-newline-no-null-bytes
    """

    def __init__(self, reference_lists=0, key_elements=1):
        """Create a GraphIndex builder.

        :param reference_lists: The number of node references lists for each
            entry.
        :param key_elements: The number of bytestrings in each key.
        """
        self.reference_lists = reference_lists
        self._keys = set()
        # A dict of {key: (absent, ref_lists, value)}
        self._nodes = {}
        # Lazily built nested dict, see _get_nodes_by_key.
        self._nodes_by_key = None
        self._key_length = key_elements

    def _check_key(self, key):
        """Raise BadIndexKey if key is not a valid key for this index."""
        if type(key) != tuple:
            raise errors.BadIndexKey(key)
        if self._key_length != len(key):
            raise errors.BadIndexKey(key)
        for element in key:
            if not element or _whitespace_re.search(element) is not None:
                raise errors.BadIndexKey(element)

    def _insert_node_by_key(self, nodes_by_key, key, value, node_refs):
        """Store the entry for key in the nested dict nodes_by_key.

        For a key of (foo, bar, baz) this sets
        nodes_by_key[foo][bar][baz] to (key, value, node_refs) when the
        index has reference lists, and to (key, value) otherwise.
        """
        if self.reference_lists:
            key_value = key, value, node_refs
        else:
            key_value = key, value
        key_dict = nodes_by_key
        for subkey in key[:-1]:
            key_dict = key_dict.setdefault(subkey, {})
        key_dict[key[-1]] = key_value

    def _get_nodes_by_key(self):
        """Return the nested by-key dict, building it on first use.

        Absent nodes (placeholders for referenced but not yet added keys)
        are left out.
        """
        if self._nodes_by_key is None:
            nodes_by_key = {}
            for key in self._nodes:
                absent, references, value = self._nodes[key]
                if absent:
                    continue
                self._insert_node_by_key(nodes_by_key, key, value, references)
            # Only publish the cache once it is complete.
            self._nodes_by_key = nodes_by_key
        return self._nodes_by_key

    def _update_nodes_by_key(self, key, value, node_refs):
        """Update the _nodes_by_key dict with a new key.

        For a key of (foo, bar, baz) create
        _nodes_by_key[foo][bar][baz] = key_value

        Does nothing when the by-key dict has not been built yet.
        """
        if self._nodes_by_key is None:
            return
        self._insert_node_by_key(self._nodes_by_key, key, value, node_refs)

    def _check_key_ref_value(self, key, references, value):
        """Check that 'key' and 'references' are all valid.

        :param key: A key tuple. Must conform to the key interface (be a tuple,
            be of the right length, not have any whitespace or nulls in any key
            element.)
        :param references: An iterable of reference lists. Something like
            [[(ref, key)], [(ref, key), (other, key)]]
        :param value: The value associate with this key. Must not contain
            newlines or null characters.
        :return: (node_refs, absent_references)
            node_refs   basically a packed form of 'references' where all
                        iterables are tuples
            absent_references   reference keys that are not in self._nodes.
                                This may contain duplicates if the same key is
                                referenced in multiple lists.
        :raises errors.BadIndexKey: if key or an unknown reference is invalid.
        :raises errors.BadIndexValue: if value contains a newline or null, or
            the number of reference lists is wrong for this index.
        """
        self._check_key(key)
        if _newline_null_re.search(value) is not None:
            raise errors.BadIndexValue(value)
        if len(references) != self.reference_lists:
            raise errors.BadIndexValue(references)
        node_refs = []
        absent_references = []
        for reference_list in references:
            for reference in reference_list:
                # If reference *is* in self._nodes, then we know it has already
                # been checked.
                if reference not in self._nodes:
                    self._check_key(reference)
                    absent_references.append(reference)
            node_refs.append(tuple(reference_list))
        return tuple(node_refs), absent_references

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain NUL or newline characters.
        :raises errors.BadIndexDuplicateKey: if key was already added.
        """
        (node_refs,
         absent_references) = self._check_key_ref_value(key, references, value)
        if key in self._nodes and self._nodes[key][0] != 'a':
            raise errors.BadIndexDuplicateKey(key, self)
        for reference in absent_references:
            # There may be duplicates, but I don't think it is worth worrying
            # about
            self._nodes[reference] = ('a', (), '')
        self._nodes[key] = ('', node_refs, value)
        self._keys.add(key)
        # Keep an already built by-key dict in step with _nodes for every key
        # length; this is a no-op while the dict has not been built.
        self._update_nodes_by_key(key, value, node_refs)

    def finish(self):
        """Serialise the index.

        :return: A StringIO holding the complete serialised index.
        :raises errors.BzrError: if the serialised length differs from the
            length computed up front (only checked when the index has
            reference lists).
        """
        lines = [_SIGNATURE]
        lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
        lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
        lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')
        prefix_length = sum(len(x) for x in lines)
        # references are byte offsets. To avoid having to do nasty
        # polynomial work to resolve offsets (references to later in the
        # file cannot be determined until all the inbetween references have
        # been calculated too) we pad the offsets with 0's to make them be
        # of consistent length. Using binary offsets would break the trivial
        # file parsing.
        # to calculate the width of zero's needed we do three passes:
        # one to gather all the non-reference data and the number of references.
        # one to pad all the data with reference-length and determine entry
        # addresses.
        # One to serialise.

        # forward sorted by key. In future we may consider topological sorting,
        # at the cost of table scans for direct lookup, or a second index for
        # direct lookup
        nodes = sorted(self._nodes.items())
        # if we do not prepass, we don't know how long it will be up front.
        expected_bytes = None
        # we only need to pre-pass if we have reference lists at all.
        if self.reference_lists:
            key_offset_info = []
            non_ref_bytes = prefix_length
            total_references = 0
            # TODO use simple multiplication for the constants in this loop.
            for key, (absent, references, value) in nodes:
                # record the offset known *so far* for this key:
                # the non reference bytes to date, and the total references to
                # date - saves reaccumulating on the second pass
                key_offset_info.append((key, non_ref_bytes, total_references))
                # key is literal, value is literal, there are 3 null's, 1 NL
                # key is variable length tuple, \x00 between elements
                non_ref_bytes += sum(len(element) for element in key)
                if self._key_length > 1:
                    non_ref_bytes += self._key_length - 1
                # value is literal bytes, there are 3 null's, 1 NL.
                non_ref_bytes += len(value) + 3 + 1
                # one byte for absent if set.
                if absent:
                    non_ref_bytes += 1
                else:
                    # (ref_lists -1) tabs
                    non_ref_bytes += self.reference_lists - 1
                    # (ref-1 cr's per ref_list)
                    for ref_list in references:
                        # how many references across the whole file?
                        total_references += len(ref_list)
                        # accrue reference separators
                        if ref_list:
                            non_ref_bytes += len(ref_list) - 1
            # how many digits are needed to represent the total byte count?
            digits = 1
            possible_total_bytes = non_ref_bytes + total_references*digits
            while 10 ** digits < possible_total_bytes:
                digits += 1
                possible_total_bytes = non_ref_bytes + total_references*digits
            expected_bytes = possible_total_bytes + 1 # terminating newline
            # resolve key addresses.
            key_addresses = {}
            for key, key_non_ref_bytes, key_references in key_offset_info:
                key_addresses[key] = key_non_ref_bytes + key_references*digits
            # serialise
            format_string = '%%0%sd' % digits
        # Without reference lists every node's references tuple is empty, so
        # format_string and key_addresses are never consulted below.
        for key, (absent, references, value) in nodes:
            flattened_references = []
            for ref_list in references:
                ref_addresses = [format_string % key_addresses[reference]
                                 for reference in ref_list]
                flattened_references.append('\r'.join(ref_addresses))
            string_key = '\x00'.join(key)
            lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,
                '\t'.join(flattened_references), value))
        lines.append('\n')
        result = StringIO(''.join(lines))
        if expected_bytes and len(result.getvalue()) != expected_bytes:
            raise errors.BzrError('Failed index creation. Internal error:'
                ' mismatched output length and expected length: %d %d' %
                (len(result.getvalue()), expected_bytes))
        return result

280

281

282

class GraphIndex(object):

283

"""An index for data with embedded graphs.

284

285

The index maps keys to a list of key reference lists, and a value.

286

Each node has the same number of key reference lists. Each key reference

287

list can be empty or an arbitrary length. The value is an opaque NULL

288

terminated string without any newlines. The storage of the index is

289

hidden in the interface: keys and key references are always tuples of

290

bytestrings, never the internal representation (e.g. dictionary offsets).

291

292

It is presumed that the index will not be mutated - it is static data.

293

294

Successive iter_all_entries calls will read the entire index each time.

295

Additionally, iter_entries calls will read the index linearly until the

296

desired keys are found. XXX: This must be fixed before the index is

297

suitable for production use. :XXX

298

"""

299

300

def __init__(self, transport, name, size):

301

"""Open an index called name on transport.

302

303

:param transport: A bzrlib.transport.Transport.

304

:param name: A path to provide to transport API calls.

305

:param size: The size of the index in bytes. This is used for bisection

306

logic to perform partial index reads. While the size could be

307

obtained by statting the file this introduced an additional round

308

trip as well as requiring stat'able transports, both of which are

309

avoided by having it supplied. If size is None, then bisection

310

support will be disabled and accessing the index will just stream

311

all the data.

312

"""

313

self._transport = transport

314

self._name = name

315

# Becomes a dict of key:(value, reference-list-byte-locations) used by

316

# the bisection interface to store parsed but not resolved keys.

317

self._bisect_nodes = None

318

# Becomes a dict of key:(value, reference-list-keys) which are ready to

319

# be returned directly to callers.

320

self._nodes = None

321

# a sorted list of slice-addresses for the parsed bytes of the file.

322

# e.g. (0,1) would mean that byte 0 is parsed.

323

self._parsed_byte_map = []

324

# a sorted list of keys matching each slice address for parsed bytes

325

# e.g. (None, 'foo@bar') would mean that the first byte contained no

326

# key, and the end byte of the slice is the of the data for 'foo@bar'

327

self._parsed_key_map = []

328

self._key_count = None

329

self._keys_by_offset = None

330

self._nodes_by_key = None

331

self._size = size

332

333

def __eq__(self, other):

334

"""Equal when self and other were created with the same parameters."""

335

return (

336

type(self) == type(other) and

337

self._transport == other._transport and

338

self._name == other._name and

339

self._size == other._size)

340

341

def __ne__(self, other):

342

return not self.__eq__(other)

343

344

def __repr__(self):

345

return "%s(%r)" % (self.__class__.__name__,

346

self._transport.abspath(self._name))

347

348

def _buffer_all(self):
    """Read the whole index from the transport and parse it into memory.

    Replaces self._keys_by_offset, self._nodes and self._nodes_by_key and
    sets self._keys.

    :raises errors.BadIndexData: if parsing did not report exactly one
        trailer line.
    """
    if 'index' in debug.debug_flags:
        mutter('Reading entire index %s', self._transport.abspath(self._name))
    stream = self._transport.get(self._name)
    self._read_prefix(stream)
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # ready-to-return key:value or key:value, node_ref_lists
    self._nodes = {}
    self._nodes_by_key = {}
    body_start = stream.tell()
    body_lines = stream.read().split('\n')
    # drop the fragment that follows the final newline
    del body_lines[-1]
    _, _, _, trailers = self._parse_lines(body_lines, body_start)
    for key, absent, references, value in self._keys_by_offset.itervalues():
        if absent:
            continue
        if self.node_ref_lists:
            # resolve references:
            resolved = self._resolve_references(references)
            node_value = (value, resolved)
            key_value = key, value, resolved
        else:
            node_value = value
            key_value = key, value
        self._nodes[key] = node_value
        if self._key_length > 1:
            # TODO: We may want to do this lazily, but if we are calling
            #       _buffer_all, we are likely to be doing
            #       iter_entries_prefix
            # For a key of (foo, bar, baz) create
            # _nodes_by_key[foo][bar][baz] = key_value
            level = self._nodes_by_key
            for subkey in key[:-1]:
                level = level.setdefault(subkey, {})
            level[key[-1]] = key_value
    # cache the keys for quick set intersections
    self._keys = set(self._nodes)
    if trailers != 1:
        # there must be one line - the empty trailer line.
        raise errors.BadIndexData(self)

397

398

def iter_all_entries(self):
    """Iterate over every key held in the index.

    The whole index is buffered first if that has not happened yet.

    :return: An iterable of (index, key, value) or
        (index, key, value, reference_lists). The former tuple is used
        when there are no reference lists in the index, making the API
        compatible with simple key:value index types. There is no defined
        order for the result iteration - it will be in the most efficient
        order for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    if not self.node_ref_lists:
        for key, value in self._nodes.iteritems():
            yield self, key, value
        return
    for key, (value, node_ref_lists) in self._nodes.iteritems():
        yield self, key, value, node_ref_lists

418

419

def _read_prefix(self, stream):
    """Read the signature and the three option lines from stream.

    Sets self.node_ref_lists, self._key_length and self._key_count.

    :param stream: A file-like object positioned at the start of the index.
    :raises errors.BadIndexFormatSignature: if the signature does not match.
    :raises errors.BadIndexOptions: if an option line has the wrong prefix
        or a non-integer value.
    """
    signature = stream.read(len(self._signature()))
    if not signature == self._signature():
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    # The option lines appear in this fixed order.
    option_specs = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    for prefix, attribute in option_specs:
        options_line = stream.readline()
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            # [:-1] drops the last character of the line (the newline).
            parsed = int(options_line[len(prefix):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed)

444

445

def _resolve_references(self, references):

446

"""Return the resolved key references for references.

447

448

References are resolved by looking up the location of the key in the

449

_keys_by_offset map and substituting the key name, preserving ordering.

450

451

:param references: An iterable of iterables of key locations. e.g.

452

[[123, 456], [123]]

453

:return: A tuple of tuples of keys.

454

"""

455

node_refs = []

456

for ref_list in references:

457

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

458

return tuple(node_refs)

459

460

def _find_index(self, range_map, key):

461

"""Helper for the _parsed_*_index calls.

462

463

Given a range map - [(start, end), ...], finds the index of the range

464

in the map for key if it is in the map, and if it is not there, the

465

immediately preceeding range in the map.

466

"""

467

result = bisect_right(range_map, key) - 1

468

if result + 1 < len(range_map):

469

# check the border condition, it may be in result + 1

470

if range_map[result + 1][0] == key[0]:

471

return result + 1

472

return result

473

474

def _parsed_byte_index(self, offset):

475

"""Return the index of the entry immediately before offset.

476

477

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

478

there is one unparsed byte (the 11th, addressed as[10]). then:

479

asking for 0 will return 0

480

asking for 10 will return 0

481

asking for 11 will return 1

482

asking for 12 will return 1

483

"""

484

key = (offset, 0)

485

return self._find_index(self._parsed_byte_map, key)

486

487

def _parsed_key_index(self, key):

488

"""Return the index of the entry immediately before key.

489

490

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

491

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

492

have been parsed, then:

493

asking for '' will return 0

494

asking for 'a' will return 0

495

asking for 'b' will return 1

496

asking for 'e' will return 1

497

"""

498

search_key = (key, None)

499

return self._find_index(self._parsed_key_map, search_key)

500

501

def _is_parsed(self, offset):

502

"""Returns True if offset has been parsed."""

503

index = self._parsed_byte_index(offset)

504

if index == len(self._parsed_byte_map):

505

return offset < self._parsed_byte_map[index - 1][1]

506

start, end = self._parsed_byte_map[index]

507

return offset >= start and offset < end

508

509

def _iter_entries_from_total_buffer(self, keys):

510

"""Iterate over keys when the entire index is parsed."""

511

keys = keys.intersection(self._keys)

512

if self.node_ref_lists:

513

for key in keys:

514

value, node_refs = self._nodes[key]

515

yield self, key, value, node_refs

516

else:

517

for key in keys:

518

yield self, key, self._nodes[key]

519

520

def iter_entries(self, keys):

521

"""Iterate over keys within the index.

522

523

:param keys: An iterable providing the keys to be retrieved.

524

:return: An iterable as per iter_all_entries, but restricted to the

525

keys supplied. No additional keys will be returned, and every

526

key supplied that is in the index will be returned.

527

"""

528

keys = set(keys)

529

if not keys:

530

return []

531

if self._size is None and self._nodes is None:

532

self._buffer_all()

533

# We fit about 20 keys per minimum-read (4K), so if we are looking for

534

# more than 1/20th of the index its likely (assuming homogenous key

535

# spread) that we'll read the entire index. If we're going to do that,

536

# buffer the whole thing. A better analysis might take key spread into

537

# account - but B+Tree indices are better anyway.

538

# We could look at all data read, and use a threshold there, which will

539

# trigger on ancestry walks, but that is not yet fully mapped out.

540

if self._nodes is None and len(keys) * 20 > self.key_count():

541

self._buffer_all()

542

if self._nodes is not None:

543

return self._iter_entries_from_total_buffer(keys)

544

else:

545

return (result[1] for result in bisect_multi_bytes(

546

self._lookup_keys_via_location, self._size, keys))

547

548

def iter_entries_prefix(self, keys):

549

"""Iterate over keys within the index using prefix matching.

550

551

Prefix matching is applied within the tuple of a key, not to within

552

the bytestring of each key element. e.g. if you have the keys ('foo',

553

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

554

only the former key is returned.

555

556

WARNING: Note that this method currently causes a full index parse

557

unconditionally (which is reasonably appropriate as it is a means for

558

thunking many small indices into one larger one and still supplies

559

iter_all_entries at the thunk layer).

560

561

:param keys: An iterable providing the key prefixes to be retrieved.

562

Each key prefix takes the form of a tuple the length of a key, but

563

with the last N elements 'None' rather than a regular bytestring.

564

The first element cannot be 'None'.

565

:return: An iterable as per iter_all_entries, but restricted to the

566

keys with a matching prefix to those supplied. No additional keys

567

will be returned, and every match that is in the index will be

568

returned.

569

"""

570

keys = set(keys)

571

if not keys:

572

return

573

# load data - also finds key lengths

574

if self._nodes is None:

575

self._buffer_all()

576

if self._key_length == 1:

577

for key in keys:

578

# sanity check

579

if key[0] is None:

580

raise errors.BadIndexKey(key)

581

if len(key) != self._key_length:

582

raise errors.BadIndexKey(key)

583

if self.node_ref_lists:

584

value, node_refs = self._nodes[key]

585

yield self, key, value, node_refs

586

else:

587

yield self, key, self._nodes[key]

588

return

589

for key in keys:

590

# sanity check

591

if key[0] is None:

592

raise errors.BadIndexKey(key)

593

if len(key) != self._key_length:

594

raise errors.BadIndexKey(key)

595

# find what it refers to:

596

key_dict = self._nodes_by_key

597

elements = list(key)

598

# find the subdict whose contents should be returned.

599

try:

600

while len(elements) and elements[0] is not None:

601

key_dict = key_dict[elements[0]]

602

elements.pop(0)

603

except KeyError:

604

# a non-existant lookup.

605

continue

606

if len(elements):

607

dicts = [key_dict]

608

while dicts:

609

key_dict = dicts.pop(-1)

610

# can't be empty or would not exist

611

item, value = key_dict.iteritems().next()

612

if type(value) == dict:

613

# push keys

614

dicts.extend(key_dict.itervalues())

615

else:

616

# yield keys

617

for value in key_dict.itervalues():

618

# each value is the key:value:node refs tuple

619

# ready to yield.

620

yield (self, ) + value

621

else:

622

# the last thing looked up was a terminal element

623

yield (self, ) + key_dict

624

625

def key_count(self):

626

"""Return an estimate of the number of keys in this index.

627

628

For GraphIndex the estimate is exact.

629

"""

630

if self._key_count is None:

631

self._read_and_parse([_HEADER_READV])

632

return self._key_count

633

634

def _lookup_keys_via_location(self, location_keys):
    """Public interface for implementing bisection.

    If _buffer_all has been called, then all the data for the index is in
    memory, and this method should not be called, as it uses a separate
    cache because it cannot pre-resolve all indices, which buffer_all does
    for performance.

    Works in up to two read passes: the first reads around every probed
    location that is not answerable from already parsed data, the second
    reads the locations of references that are still unresolved.

    :param location_keys: A list of location(byte offset), key tuples.
    :return: A list of (location_key, result) tuples as expected by
        bzrlib.bisect_multi.bisect_multi_bytes. result is the index entry
        tuple when the key was found, False when the region that would
        hold the key has been parsed without finding it, and otherwise -1
        or +1 to say whether the key sorts below or above the probed
        location.
    """
    # Possible improvements:
    #  - only bisect lookup each key once
    #  - sort the keys first, and use that to reduce the bisection window
    # -----
    # this progresses in three parts:
    # read data
    # parse it
    # attempt to answer the question from the now in memory data.
    # build the readv request
    # for each location, ask for 800 bytes - much more than rows we've seen
    # anywhere.
    readv_ranges = []
    for location, key in location_keys:
        # can we answer from cache?
        if self._bisect_nodes and key in self._bisect_nodes:
            # We have the key parsed.
            continue
        index = self._parsed_key_index(key)
        if (len(self._parsed_key_map) and
            self._parsed_key_map[index][0] <= key and
            (self._parsed_key_map[index][1] >= key or
             # end of the file has been parsed
             self._parsed_byte_map[index][1] == self._size)):
            # the key has been parsed, so no lookup is needed even if its
            # not present.
            continue
        # - if we have examined this part of the file already - yes
        index = self._parsed_byte_index(location)
        if (len(self._parsed_byte_map) and
            self._parsed_byte_map[index][0] <= location and
            self._parsed_byte_map[index][1] > location):
            # the byte region has been parsed, so no read is needed.
            continue
        length = 800
        # never request bytes past the end of the file
        if location + length > self._size:
            length = self._size - location
        # todo, trim out parsed locations.
        if length > 0:
            readv_ranges.append((location, length))
    # read the header if needed
    if self._bisect_nodes is None:
        readv_ranges.append(_HEADER_READV)
    self._read_and_parse(readv_ranges)
    # generate results:
    #  - figure out <, >, missing, present
    #  - result present references so we can return them.
    result = []
    # keys that we cannot answer until we resolve references
    pending_references = []
    pending_locations = set()
    for location, key in location_keys:
        # can we answer from cache?
        if key in self._bisect_nodes:
            # the key has been parsed, so no lookup is needed
            if self.node_ref_lists:
                # the references may not have been all parsed.
                value, refs = self._bisect_nodes[key]
                wanted_locations = []
                for ref_list in refs:
                    for ref in ref_list:
                        if ref not in self._keys_by_offset:
                            wanted_locations.append(ref)
                if wanted_locations:
                    # defer this key until the second read pass below
                    pending_locations.update(wanted_locations)
                    pending_references.append((location, key))
                    continue
                result.append(((location, key), (self, key,
                    value, self._resolve_references(refs))))
            else:
                result.append(((location, key),
                    (self, key, self._bisect_nodes[key])))
            continue
        else:
            # has the region the key should be in, been parsed?
            index = self._parsed_key_index(key)
            if (self._parsed_key_map[index][0] <= key and
                (self._parsed_key_map[index][1] >= key or
                 # end of the file has been parsed
                 self._parsed_byte_map[index][1] == self._size)):
                # parsed but not found: the key is not in the index
                result.append(((location, key), False))
                continue
        # no, is the key above or below the probed location:
        # get the range of the probed & parsed location
        index = self._parsed_byte_index(location)
        # if the key is below the start of the range, its below
        if key < self._parsed_key_map[index][0]:
            direction = -1
        else:
            direction = +1
        result.append(((location, key), direction))
    readv_ranges = []
    # lookup data to resolve references
    for location in pending_locations:
        length = 800
        if location + length > self._size:
            length = self._size - location
        # TODO: trim out parsed locations (e.g. if the 800 is into the
        # parsed region trim it, and dont use the adjust_for_latency
        # facility)
        if length > 0:
            readv_ranges.append((location, length))
    self._read_and_parse(readv_ranges)
    for location, key in pending_references:
        # answer key references we had to look-up-late.
        # NOTE(review): index is assigned but not used in this loop.
        index = self._parsed_key_index(key)
        value, refs = self._bisect_nodes[key]
        result.append(((location, key), (self, key,
            value, self._resolve_references(refs))))
    return result

755

756

def _parse_header_from_bytes(self, bytes):
    """Parse the signature and option lines from the start of bytes.

    Sets self.node_ref_lists, self._key_length and self._key_count,
    records the header as parsed and resets the bisection parsing state.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data. (which may be of length 0).
    :raises errors.BadIndexFormatSignature: if the signature does not match.
    :raises errors.BadIndexOptions: if an option line has the wrong prefix
        or a non-integer value.
    """
    signature = bytes[0:len(self._signature())]
    if not signature == self._signature():
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(self._signature()):].splitlines()
    # The option lines appear in this fixed order.
    option_specs = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    for line_number, (prefix, attribute) in enumerate(option_specs):
        options_line = lines[line_number]
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            parsed = int(options_line[len(prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed)
    # calculate the bytes we have processed: the signature, the three option
    # lines and the three line terminators that splitlines removed.
    option_bytes = len(lines[0]) + len(lines[1]) + len(lines[2])
    header_end = len(signature) + option_bytes + 3
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

799

800

def _parse_region(self, offset, data):

801

"""Parse node data returned from a readv operation.

802

803

:param offset: The byte offset the data starts at.

804

:param data: The data to parse.

805

"""

806

# trim the data.

807

# end first:

808

end = offset + len(data)

809

high_parsed = offset

810

while True:

811

# Trivial test - if the current index's end is within the

812

# low-matching parsed range, we're done.

813

index = self._parsed_byte_index(high_parsed)

814

if end < self._parsed_byte_map[index][1]:

815

return

816

# print "[%d:%d]" % (offset, end), \

817

# self._parsed_byte_map[index:index + 2]

818

high_parsed, last_segment = self._parse_segment(

819

offset, data, end, index)

820

if last_segment:

821

return

822

823

def _parse_segment(self, offset, data, end, index):

824

"""Parse one segment of data.

825

826

:param offset: Where 'data' begins in the file.

827

:param data: Some data to parse a segment of.

828

:param end: Where data ends

829

:param index: The current index into the parsed bytes map.

830

:return: True if the parsed segment is the last possible one in the

831

range of data.

832

:return: high_parsed_byte, last_segment.

833

high_parsed_byte is the location of the highest parsed byte in this

834

segment, last_segment is True if the parsed segment is the last

835

possible one in the data block.

836

"""

837

# default is to use all data

838

trim_end = None

839

# accomodate overlap with data before this.

840

if offset < self._parsed_byte_map[index][1]:

841

# overlaps the lower parsed region

842

# skip the parsed data

843

trim_start = self._parsed_byte_map[index][1] - offset

844

# don't trim the start for \n

845

start_adjacent = True

846

elif offset == self._parsed_byte_map[index][1]:

847

# abuts the lower parsed region

848

# use all data

849

trim_start = None

850

# do not trim anything

851

start_adjacent = True

852

else:

853

# does not overlap the lower parsed region

854

# use all data

855

trim_start = None

856

# but trim the leading \n

857

start_adjacent = False

858

if end == self._size:

859

# lines up to the end of all data:

860

# use it all

861

trim_end = None

862

# do not strip to the last \n

863

end_adjacent = True

864

last_segment = True

865

elif index + 1 == len(self._parsed_byte_map):

866

# at the end of the parsed data

867

# use it all

868

trim_end = None

869

# but strip to the last \n

870

end_adjacent = False

871

last_segment = True

872

elif end == self._parsed_byte_map[index + 1][0]:

873

# buts up against the next parsed region

874

# use it all

875

trim_end = None

876

# do not strip to the last \n

877

end_adjacent = True

878

last_segment = True

879

elif end > self._parsed_byte_map[index + 1][0]:

880

# overlaps into the next parsed region

881

# only consider the unparsed data

882

trim_end = self._parsed_byte_map[index + 1][0] - offset

883

# do not strip to the last \n as we know its an entire record

884

end_adjacent = True

885

last_segment = end < self._parsed_byte_map[index + 1][1]

886

else:

887

# does not overlap into the next region

888

# use it all

889

trim_end = None

890

# but strip to the last \n

891

end_adjacent = False

892

last_segment = True

893

# now find bytes to discard if needed

894

if not start_adjacent:

895

# work around python bug in rfind

896

if trim_start is None:

897

trim_start = data.find('\n') + 1

898

else:

899

trim_start = data.find('\n', trim_start) + 1

900

if not (trim_start != 0):

901

raise AssertionError('no \n was present')

902

# print 'removing start', offset, trim_start, repr(data[:trim_start])

903

if not end_adjacent:

904

# work around python bug in rfind

905

if trim_end is None:

906

trim_end = data.rfind('\n') + 1

907

else:

908

trim_end = data.rfind('\n', None, trim_end) + 1

909

if not (trim_end != 0):

910

raise AssertionError('no \n was present')

911

# print 'removing end', offset, trim_end, repr(data[trim_end:])

912

# adjust offset and data to the parseable data.

913

trimmed_data = data[trim_start:trim_end]

914

if not (trimmed_data):

915

raise AssertionError('read unneeded data [%d:%d] from [%d:%d]'

916

% (trim_start, trim_end, offset, offset + len(data)))

917

if trim_start:

918

offset += trim_start

919

# print "parsing", repr(trimmed_data)

920

# splitlines mangles the \r delimiters.. don't use it.

921

lines = trimmed_data.split('\n')

922

del lines[-1]

923

pos = offset

924

first_key, last_key, nodes, _ = self._parse_lines(lines, pos)

925

for key, value in nodes:

926

self._bisect_nodes[key] = value

927

self._parsed_bytes(offset, first_key,

928

offset + len(trimmed_data), last_key)

929

return offset + len(trimmed_data), last_segment

930

931

def _parse_lines(self, lines, pos):

932

key = None

933

first_key = None

934

trailers = 0

935

nodes = []

936

for line in lines:

937

if line == '':

938

# must be at the end

939

if self._size:

940

if not (self._size == pos + 1):

941

raise AssertionError("%s %s" % (self._size, pos))

942

trailers += 1

943

continue

944

elements = line.split('\0')

945

if len(elements) != self._expected_elements:

946

raise errors.BadIndexData(self)

947

# keys are tuples. Each element is a string that may occur many

948

# times, so we intern them to save space. AB, RC, 200807

949

key = tuple(intern(element) for element in elements[:self._key_length])

950

if first_key is None:

951

first_key = key

952

absent, references, value = elements[-3:]

953

ref_lists = []

954

for ref_string in references.split('\t'):

955

ref_lists.append(tuple([

956

int(ref) for ref in ref_string.split('\r') if ref

957

]))

958

ref_lists = tuple(ref_lists)

959

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

960

pos += len(line) + 1 # +1 for the \n

961

if absent:

962

continue

963

if self.node_ref_lists:

964

node_value = (value, ref_lists)

965

else:

966

node_value = value

967

nodes.append((key, node_value))

968

# print "parsed ", key

969

return first_key, key, nodes, trailers

970

971

def _parsed_bytes(self, start, start_key, end, end_key):

972

"""Mark the bytes from start to end as parsed.

973

974

Calling self._parsed_bytes(1,2) will mark one byte (the one at offset

975

1) as parsed.

976

977

:param start: The start of the parsed region.

978

:param end: The end of the parsed region.

979

"""

980

index = self._parsed_byte_index(start)

981

new_value = (start, end)

982

new_key = (start_key, end_key)

983

if index == -1:

984

# first range parsed is always the beginning.

985

self._parsed_byte_map.insert(index, new_value)

986

self._parsed_key_map.insert(index, new_key)

987

return

988

# four cases:

989

# new region

990

# extend lower region

991

# extend higher region

992

# combine two regions

993

if (index + 1 < len(self._parsed_byte_map) and

994

self._parsed_byte_map[index][1] == start and

995

self._parsed_byte_map[index + 1][0] == end):

996

# combine two regions

997

self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],

998

self._parsed_byte_map[index + 1][1])

999

self._parsed_key_map[index] = (self._parsed_key_map[index][0],

1000

self._parsed_key_map[index + 1][1])

1001

del self._parsed_byte_map[index + 1]

1002

del self._parsed_key_map[index + 1]

1003

elif self._parsed_byte_map[index][1] == start:

1004

# extend the lower entry

1005

self._parsed_byte_map[index] = (

1006

self._parsed_byte_map[index][0], end)

1007

self._parsed_key_map[index] = (

1008

self._parsed_key_map[index][0], end_key)

1009

elif (index + 1 < len(self._parsed_byte_map) and

1010

self._parsed_byte_map[index + 1][0] == end):

1011

# extend the higher entry

1012

self._parsed_byte_map[index + 1] = (

1013

start, self._parsed_byte_map[index + 1][1])

1014

self._parsed_key_map[index + 1] = (

1015

start_key, self._parsed_key_map[index + 1][1])

1016

else:

1017

# new entry

1018

self._parsed_byte_map.insert(index + 1, new_value)

1019

self._parsed_key_map.insert(index + 1, new_key)

1020

1021

def _read_and_parse(self, readv_ranges):

1022

"""Read the the ranges and parse the resulting data.

1023

1024

:param readv_ranges: A prepared readv range list.

1025

"""

1026

if readv_ranges:

1027

readv_data = self._transport.readv(self._name, readv_ranges, True,

1028

self._size)

1029

# parse

1030

for offset, data in readv_data:

1031

if self._bisect_nodes is None:

1032

# this must be the start

1033

if not (offset == 0):

1034

raise AssertionError()

1035

offset, data = self._parse_header_from_bytes(data)

1036

# print readv_ranges, "[%d:%d]" % (offset, offset + len(data))

1037

self._parse_region(offset, data)

1038

1039

def _signature(self):
    """The file signature for this index type.

    :return: The module-level _SIGNATURE value.
    """
    return _SIGNATURE

1042

1043

def validate(self):
    """Validate that everything in the index can be accessed."""
    # Walking every entry validates completely at the moment, so simply
    # exhaust the iterator and discard what it produces.
    for _entry in self.iter_all_entries():
        continue

1048

1049

1050

class CombinedGraphIndex(object):
    """A GraphIndex made up from smaller GraphIndices.

    The backing indices must implement GraphIndex, and are presumed to be
    static data.

    Queries are made against the child indices in list order: the first
    index, then the second, and so on. The order can therefore influence
    performance significantly. For example, an index on local disk should be
    placed before an index on a remote server.
    """

    def __init__(self, indices):
        """Create a CombinedGraphIndex backed by indices.

        :param indices: An ordered list of indices to query for data. The
            list is kept by reference, not copied.
        """
        self._indices = indices

    def __repr__(self):
        child_reprs = [repr(child) for child in self._indices]
        return "%s(%s)" % (self.__class__.__name__, ', '.join(child_reprs))

    @symbol_versioning.deprecated_method(symbol_versioning.one_one)
    def get_parents(self, revision_ids):
        """See graph._StackedParentsProvider.get_parents.

        This implementation thunks the graph.Graph.get_parents api across to
        GraphIndex.

        :param revision_ids: An iterable of graph keys for this graph.
        :return: A list of parent details for each key in revision_ids.
            Each parent details will be one of:
             * None when the key was missing
             * (NULL_REVISION,) when the key has no parents.
             * (parent_key, parent_key...) otherwise.
        """
        lookup = self.get_parent_map(revision_ids).get
        return [lookup(revision_id, None) for revision_id in revision_ids]

    def get_parent_map(self, keys):
        """See graph._StackedParentsProvider.get_parent_map"""
        pending = set(keys)
        parent_map = {}
        if NULL_REVISION in pending:
            # NULL_REVISION is answered directly and never looked up.
            pending.discard(NULL_REVISION)
            parent_map[NULL_REVISION] = []
        for _index, key, _value, refs in self.iter_entries(pending):
            # The first reference list holds the parents.
            parent_map[key] = refs[0] or (NULL_REVISION,)
        return parent_map

    def insert_index(self, pos, index):
        """Insert a new index in the list of indices to query.

        :param pos: The position to insert the index.
        :param index: The index to insert.
        """
        self._indices.insert(pos, index)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        :return: An iterable of the nodes produced by the child indices,
            unchanged; get_parent_map unpacks such nodes as
            (index, key, value, reference_lists). There is no defined order
            for the result iteration - it will be in the most efficient
            order for the index.
        """
        reported = set()
        for child in self._indices:
            for node in child.iter_all_entries():
                key = node[1]
                if key in reported:
                    continue
                yield node
                reported.add(key)

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of the nodes produced by the child indices,
            unchanged; get_parent_map unpacks them as
            (index, key, value, reference_lists). There is no defined order
            for the result iteration - it will be in the most efficient
            order for the index.
        """
        remaining = set(keys)
        for child in self._indices:
            if not remaining:
                return
            # Each key is dropped once found, so later indices are only
            # asked for the keys that are still missing.
            for node in child.iter_entries(remaining):
                remaining.remove(node[1])
                yield node

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        prefixes = set(keys)
        if not prefixes:
            return
        reported = set()
        for child in self._indices:
            for node in child.iter_entries_prefix(prefixes):
                key = node[1]
                if key not in reported:
                    reported.add(key)
                    yield node

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For CombinedGraphIndex this is approximated by the sum of the keys of
        the child indices. As child indices may have duplicate keys this can
        have a maximum error of the number of child indices * largest number of
        keys in any index.
        """
        total = 0
        for child in self._indices:
            total = total + child.key_count()
        return total

    def validate(self):
        """Validate that everything in the index can be accessed."""
        for child in self._indices:
            child.validate()

1196

1197

1198

class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during a
    single write operation, where the accumulated entries need to be immediately
    available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add
            when the index has reference lists, or of (key, value) entries
            when it does not.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        Nodes flagged as absent are not reported.

        :return: An iterable of (index, key, value, reference_lists) when the
            index has reference lists, otherwise of (index, key, value).
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (in this case
            dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        if self.reference_lists:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value, references
        else:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Keys that are not in the index, or whose node is flagged as absent,
        are not reported.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists) when the
            index has reference lists, otherwise of (index, key, value).
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (keys iteration order
            in this case).
        """
        keys = set(keys)
        if self.reference_lists:
            for key in keys.intersection(self._keys):
                # nodes are stored as (absent, references, value)
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2], node[1]
        else:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned. Prefixes that match nothing yield nothing.
        :raises BadIndexKey: if a prefix starts with None or is not the
            length of a key.
        """
        # XXX: Too much duplication with the GraphIndex class; consider finding
        # a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        if self._key_length == 1:
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                try:
                    node = self._nodes[key]
                except KeyError:
                    # a non-existent lookup: report nothing for this key,
                    # as the multi-element branch below does.
                    continue
                if node[0]:
                    # absent node
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
            return
        nodes_by_key = self._get_nodes_by_key()
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = nodes_by_key
            elements = list(key)
            # find the subdict to return
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                # Some trailing elements were None: walk every nested dict
                # below this point and report all the nodes found there.
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    item, value = key_dict.iteritems().next()
                    if isinstance(value, dict):
                        # push keys
                        dicts.extend(key_dict.itervalues())
                    else:
                        # yield keys
                        for value in key_dict.itervalues():
                            yield (self, ) + value
            else:
                # The full key was given, so key_dict is the node itself.
                yield (self, ) + key_dict

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory index's have no known corruption at the moment."""

1337

1338

1339

class GraphIndexPrefixAdapter(object):
    """An adapter between GraphIndex with different key lengths.

    Queries against this will emit queries against the adapted Graph with the
    prefix added, queries for all items use iter_entries_prefix. The returned
    nodes will have their keys and node references adjusted to remove the
    prefix. Finally, an add_nodes_callback can be supplied - when called the
    nodes and references being added will have prefix prepended.
    """

    def __init__(self, adapted, prefix, missing_key_length,
        add_nodes_callback=None):
        """Construct an adapter against adapted with prefix.

        :param adapted: The index that queries are forwarded to.
        :param prefix: The key prefix (a tuple) to add and strip.
        :param missing_key_length: How many None elements follow the prefix
            in the key used to query for all entries.
        :param add_nodes_callback: Called with the translated nodes by
            add_nodes.
        """
        self.adapted = adapted
        self.add_nodes_callback = add_nodes_callback
        self.prefix = prefix
        self.prefix_len = len(prefix)
        self.prefix_key = prefix + (None,)*missing_key_length

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add,
            or of (key, value) entries when there are no references.
        """
        # save nodes in case its an iterator
        pending = tuple(nodes)
        translated = []
        try:
            # node_refs is a tuple of tuples of keys: take it apart and put
            # the prefix in front of every referenced key.
            for key, value, node_refs in pending:
                prefixed_refs = []
                for ref_list in node_refs:
                    prefixed_refs.append(
                        tuple([self.prefix + ref_node
                               for ref_node in ref_list]))
                translated.append(
                    (self.prefix + key, value, tuple(prefixed_refs)))
        except ValueError:
            # XXX: TODO add an explicit interface for getting the reference list
            # status, to handle this bit of user-friendliness in the API more
            # explicitly.
            for key, value in pending:
                translated.append((self.prefix + key, value))
        self.add_nodes_callback(translated)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain NUL or newline.
        """
        single = (key, value, references)
        self.add_nodes((single, ))

    def _strip_prefix(self, an_iter):
        """Strip prefix data from nodes and return it.

        :param an_iter: An iterable of (index, key, value, reference_lists)
            nodes from the adapted index.
        :raises BadIndexData: if a key or a referenced key does not start
            with the prefix.
        """
        for node in an_iter:
            width = self.prefix_len
            full_key = node[1]
            # cross checks
            if full_key[:width] != self.prefix:
                raise errors.BadIndexData(self)
            ref_lists = node[3]
            for ref_list in ref_lists:
                for ref_node in ref_list:
                    if ref_node[:width] != self.prefix:
                        raise errors.BadIndexData(self)
            stripped_refs = tuple(
                tuple(ref_node[width:] for ref_node in ref_list)
                for ref_list in ref_lists)
            yield node[0], full_key[width:], node[2], stripped_refs

    def iter_all_entries(self):
        """Iterate over all keys within the index

        iter_all_entries is implemented against the adapted index using
        iter_entries_prefix.

        :return: An iterable of (index, key, value, reference_lists) with the
            prefix stripped. There is no defined order for the result
            iteration - it is whatever order the adapted index produces.
        """
        matches = self.adapted.iter_entries_prefix([self.prefix_key])
        return self._strip_prefix(matches)

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists). There is no
            defined order for the result iteration - it is whatever order
            the adapted index produces.
        """
        prefixed_keys = (self.prefix + key for key in keys)
        return self._strip_prefix(self.adapted.iter_entries(prefixed_keys))

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        prefixed_keys = (self.prefix + key for key in keys)
        return self._strip_prefix(
            self.adapted.iter_entries_prefix(prefixed_keys))

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For GraphIndexPrefixAdapter this is relatively expensive - key
        iteration with the prefix is done.
        """
        entries = list(self.iter_all_entries())
        return len(entries)

    def validate(self):
        """Call the adapted's validate."""
        self.adapted.validate()

Older »