# Copyright (C) 2007, 2008 Canonical Ltd
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Indexing facilities."""

__all__ = [
    'CombinedGraphIndex',
    'GraphIndex',
    'GraphIndexBuilder',
    'GraphIndexPrefixAdapter',
    'InMemoryGraphIndex',
    ]

from bisect import bisect_right
from cStringIO import StringIO
import re
import sys

from bzrlib.lazy_import import lazy_import
lazy_import(globals(), """
from bzrlib import trace
from bzrlib.bisect_multi import bisect_multi_bytes
from bzrlib.revision import NULL_REVISION
from bzrlib.trace import mutter
""")
from bzrlib import (
    debug,
    errors,
    )
from bzrlib._static_tuple_c import StaticTuple

_HEADER_READV = (0, 200)
_OPTION_KEY_ELEMENTS = "key_elements="
_OPTION_LEN = "len="
_OPTION_NODE_REFS = "node_ref_lists="
_SIGNATURE = "Bazaar Graph Index 1\n"

_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')
_newline_null_re = re.compile('[\n\0]')


def _has_key_from_parent_map(self, key):
    """Check if this index has one key.

    If it's possible to check for multiple keys at once through
    calling get_parent_map that should be faster.
    """
    return (key in self.get_parent_map([key]))


def _missing_keys_from_parent_map(self, keys):
    return set(keys) - set(self.get_parent_map(keys))


class GraphIndexBuilder(object):
    """A builder that can build a GraphIndex.

    The resulting graph has the structure:

    _SIGNATURE OPTIONS NODES NEWLINE
    _SIGNATURE        := 'Bazaar Graph Index 1' NEWLINE
    OPTIONS           := 'node_ref_lists=' DIGITS NEWLINE
    NODES             := NODE*
    NODE              := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE
    KEY               := Not-whitespace-utf8
    ABSENT            := 'a'
    REFERENCES        := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}
    REFERENCE_LIST    := (REFERENCE (CR REFERENCE)*)?
    REFERENCE         := DIGITS  ; digits is the byte offset in the index of the
                                 ; referenced key.
    VALUE             := no-newline-no-null-bytes
    """
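
    # Illustrative sketch (not from the original source): with
    # node_ref_lists=1 and key_elements=1, a two-node index would serialize
    # along these lines, where NN stands for the zero-padded decimal byte
    # offset of the referenced 'parent' record and a final empty line
    # terminates the file:
    #
    #   Bazaar Graph Index 1
    #   node_ref_lists=1
    #   key_elements=1
    #   len=2
    #   child\x00\x00NN\x00child-value
    #   parent\x00\x00\x00parent-value
    #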

    def __init__(self, reference_lists=0, key_elements=1):
        """Create a GraphIndex builder.

        :param reference_lists: The number of node references lists for each
            entry.
        :param key_elements: The number of bytestrings in each key.
        """
        self.reference_lists = reference_lists
        self._keys = set()
        # A dict of {key: (absent, ref_lists, value)}
        self._nodes = {}
        self._nodes_by_key = None
        self._key_length = key_elements
        self._optimize_for_size = False
        self._combine_backing_indices = True

    def _check_key(self, key):
        """Raise BadIndexKey if key is not a valid key for this index."""
        if type(key) not in (tuple, StaticTuple):
            raise errors.BadIndexKey(key)
        if self._key_length != len(key):
            raise errors.BadIndexKey(key)
        for element in key:
            if not element or _whitespace_re.search(element) is not None:
                raise errors.BadIndexKey(element)

    def _external_references(self):
        """Return references that are not present in this index."""
        keys = set()
        refs = set()
        # TODO: JAM 2008-11-21 This makes an assumption about how the reference
        #       lists are used. It is currently correct for pack-0.92 through
        #       1.9, which use the node references (3rd column) second
        #       reference list as the compression parent. Perhaps this should
        #       be moved into something higher up the stack, since it
        #       makes assumptions about how the index is used.
        if self.reference_lists > 1:
            for node in self.iter_all_entries():
                keys.add(node[1])
                refs.update(node[3][1])
            return refs - keys
        else:
            # If reference_lists == 0 there can be no external references, and
            # if reference_lists == 1, then there isn't a place to store the
            # compression parent
            return set()

    def _get_nodes_by_key(self):
        if self._nodes_by_key is None:
            nodes_by_key = {}
            if self.reference_lists:
                for key, (absent, references, value) in self._nodes.iteritems():
                    if absent:
                        continue
                    key_dict = nodes_by_key
                    for subkey in key[:-1]:
                        key_dict = key_dict.setdefault(subkey, {})
                    key_dict[key[-1]] = key, value, references
            else:
                for key, (absent, references, value) in self._nodes.iteritems():
                    if absent:
                        continue
                    key_dict = nodes_by_key
                    for subkey in key[:-1]:
                        key_dict = key_dict.setdefault(subkey, {})
                    key_dict[key[-1]] = key, value
            self._nodes_by_key = nodes_by_key
        return self._nodes_by_key

    def _update_nodes_by_key(self, key, value, node_refs):
        """Update the _nodes_by_key dict with a new key.

        For a key of (foo, bar, baz) create
        _nodes_by_key[foo][bar][baz] = key_value
        """
        if self._nodes_by_key is None:
            return
        key_dict = self._nodes_by_key
        if self.reference_lists:
            key_value = key, value, node_refs
        else:
            key_value = key, value
        for subkey in key[:-1]:
            key_dict = key_dict.setdefault(subkey, {})
        key_dict[key[-1]] = key_value
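
    # Illustrative example (not from the original source): after adding the
    # key ('foo', 'bar', 'baz') with value 'v' and no reference lists,
    # _nodes_by_key nests as
    #   {'foo': {'bar': {'baz': (('foo', 'bar', 'baz'), 'v')}}}
    # with node_refs appended to the leaf tuple when reference lists are used.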

    def _check_key_ref_value(self, key, references, value):
        """Check that 'key' and 'references' are all valid.

        :param key: A key tuple. Must conform to the key interface (be a tuple,
            be of the right length, not have any whitespace or nulls in any key
            element.)
        :param references: An iterable of reference lists. Something like
            [[(ref, key)], [(ref, key), (other, key)]]
        :param value: The value associated with this key. Must not contain
            newlines or null characters.
        :return: (node_refs, absent_references)
            node_refs           basically a packed form of 'references' where all
                                iterables are tuples
            absent_references   reference keys that are not in self._nodes.
                                This may contain duplicates if the same key is
                                referenced in multiple lists.
        """
        self._check_key(key)
        if _newline_null_re.search(value) is not None:
            raise errors.BadIndexValue(value)
        if len(references) != self.reference_lists:
            raise errors.BadIndexValue(references)
        node_refs = []
        absent_references = []
        for reference_list in references:
            for reference in reference_list:
                # If reference *is* in self._nodes, then we know it has already
                # been checked.
                if reference not in self._nodes:
                    self._check_key(reference)
                    absent_references.append(reference)
            node_refs.append(tuple(reference_list))
        return tuple(node_refs), absent_references

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \0 or \n.
        """
        (node_refs,
         absent_references) = self._check_key_ref_value(key, references, value)
        if key in self._nodes and self._nodes[key][0] != 'a':
            raise errors.BadIndexDuplicateKey(key, self)
        for reference in absent_references:
            # There may be duplicates, but I don't think it is worth worrying
            # about
            self._nodes[reference] = ('a', (), '')
        self._nodes[key] = ('', node_refs, value)
        self._keys.add(key)
        if self._nodes_by_key is not None and self._key_length > 1:
            self._update_nodes_by_key(key, value, node_refs)

    def finish(self):
        lines = [_SIGNATURE]
        lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
        lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
        lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')
        prefix_length = sum(len(x) for x in lines)
        # references are byte offsets. To avoid having to do nasty
        # polynomial work to resolve offsets (references to later in the
        # file cannot be determined until all the inbetween references have
        # been calculated too) we pad the offsets with 0's to make them be
        # of consistent length. Using binary offsets would break the trivial
        # file parsing.
        # to calculate the width of zero's needed we do three passes:
        # one to gather all the non-reference data and the number of references.
        # one to pad all the data with reference-length and determine entry
        # addresses.
        # One to serialise.

        # forward sorted by key. In future we may consider topological sorting,
        # at the cost of table scans for direct lookup, or a second index for
        # direct lookup
        nodes = sorted(self._nodes.items())
        # if we do not prepass, we don't know how long it will be up front.
        expected_bytes = None
        # we only need to pre-pass if we have reference lists at all.
        if self.reference_lists:
            key_offset_info = []
            non_ref_bytes = prefix_length
            total_references = 0
            # TODO use simple multiplication for the constants in this loop.
            for key, (absent, references, value) in nodes:
                # record the offset known *so far* for this key:
                # the non reference bytes to date, and the total references to
                # date - saves reaccumulating on the second pass
                key_offset_info.append((key, non_ref_bytes, total_references))
                # key is literal, value is literal, there are 3 null's, 1 NL
                # key is variable length tuple, \x00 between elements
                non_ref_bytes += sum(len(element) for element in key)
                if self._key_length > 1:
                    non_ref_bytes += self._key_length - 1
                # value is literal bytes, there are 3 null's, 1 NL.
                non_ref_bytes += len(value) + 3 + 1
                # one byte for absent if set.
                if absent:
                    non_ref_bytes += 1
                elif self.reference_lists:
                    # (ref_lists -1) tabs
                    non_ref_bytes += self.reference_lists - 1
                    # (ref-1 cr's per ref_list)
                    for ref_list in references:
                        # how many references across the whole file?
                        total_references += len(ref_list)
                        # accrue reference separators
                        if ref_list:
                            non_ref_bytes += len(ref_list) - 1
            # how many digits are needed to represent the total byte count?
            digits = 1
            possible_total_bytes = non_ref_bytes + total_references*digits
            while 10 ** digits < possible_total_bytes:
                digits += 1
                possible_total_bytes = non_ref_bytes + total_references*digits
            expected_bytes = possible_total_bytes + 1 # terminating newline
            # resolve key addresses.
            key_addresses = {}
            for key, non_ref_bytes, total_references in key_offset_info:
                key_addresses[key] = non_ref_bytes + total_references*digits
            # serialise
            format_string = '%%0%sd' % digits
        for key, (absent, references, value) in nodes:
            flattened_references = []
            for ref_list in references:
                ref_addresses = []
                for reference in ref_list:
                    ref_addresses.append(format_string % key_addresses[reference])
                flattened_references.append('\r'.join(ref_addresses))
            string_key = '\x00'.join(key)
            lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,
                '\t'.join(flattened_references), value))
        lines.append('\n')
        result = StringIO(''.join(lines))
        if expected_bytes and len(result.getvalue()) != expected_bytes:
            raise errors.BzrError('Failed index creation. Internal error:'
                ' mismatched output length and expected length: %d %d' %
                (len(result.getvalue()), expected_bytes))
        return result
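
    # A minimal usage sketch (illustrative, not from the original source):
    #
    #   builder = GraphIndexBuilder(reference_lists=1)
    #   builder.add_node(('parent',), 'parent-value', ([],))
    #   builder.add_node(('child',), 'child-value', ([('parent',)],))
    #   index_bytes = builder.finish().read()
    #
    # The digit-width loop above is a fixed point: for example, with 95
    # non-reference bytes and 2 references, digits=1 gives 97 possible bytes
    # (10**1 is too small), digits=2 gives 99, which 10**2 covers, so the
    # offsets are written as 2-digit zero-padded numbers.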

    def set_optimize(self, for_size=None, combine_backing_indices=None):
        """Change how the builder tries to optimize the result.

        :param for_size: Tell the builder to try and make the index as small as
            possible.
        :param combine_backing_indices: If the builder spills to disk to save
            memory, should the on-disk indices be combined. Set to True if you
            are going to be probing the index, but to False if you are not. (If
            you are not querying, then the time spent combining is wasted.)
        :return: None
        """
        # GraphIndexBuilder itself doesn't pay attention to the flag yet, but
        # child builders do.
        if for_size is not None:
            self._optimize_for_size = for_size
        if combine_backing_indices is not None:
            self._combine_backing_indices = combine_backing_indices

    def find_ancestry(self, keys, ref_list_num):
        """See CombinedGraphIndex.find_ancestry()"""
        pending = set(keys)
        parent_map = {}
        missing_keys = set()
        while pending:
            next_pending = set()
            for _, key, value, ref_lists in self.iter_entries(pending):
                parent_keys = ref_lists[ref_list_num]
                parent_map[key] = parent_keys
                next_pending.update([p for p in parent_keys if p not in
                                     parent_map])
            missing_keys.update(pending.difference(parent_map))
            pending = next_pending
        return parent_map, missing_keys


class GraphIndex(object):
    """An index for data with embedded graphs.

    The index maps keys to a list of key reference lists, and a value.
    Each node has the same number of key reference lists. Each key reference
    list can be empty or an arbitrary length. The value is an opaque NULL
    terminated string without any newlines. The storage of the index is
    hidden in the interface: keys and key references are always tuples of
    bytestrings, never the internal representation (e.g. dictionary offsets).

    It is presumed that the index will not be mutated - it is static data.

    Successive iter_all_entries calls will read the entire index each time.
    Additionally, iter_entries calls will read the index linearly until the
    desired keys are found. XXX: This must be fixed before the index is
    suitable for production use. :XXX
    """

    def __init__(self, transport, name, size):
        """Open an index called name on transport.

        :param transport: A bzrlib.transport.Transport.
        :param name: A path to provide to transport API calls.
        :param size: The size of the index in bytes. This is used for bisection
            logic to perform partial index reads. While the size could be
            obtained by statting the file this introduced an additional round
            trip as well as requiring stat'able transports, both of which are
            avoided by having it supplied. If size is None, then bisection
            support will be disabled and accessing the index will just stream
            all the data.
        """
        self._transport = transport
        self._name = name
        # Becomes a dict of key:(value, reference-list-byte-locations) used by
        # the bisection interface to store parsed but not resolved keys.
        self._bisect_nodes = None
        # Becomes a dict of key:(value, reference-list-keys) which are ready to
        # be returned directly to callers.
        self._nodes = None
        # a sorted list of slice-addresses for the parsed bytes of the file.
        # e.g. (0,1) would mean that byte 0 is parsed.
        self._parsed_byte_map = []
        # a sorted list of keys matching each slice address for parsed bytes
        # e.g. (None, 'foo@bar') would mean that the first byte contained no
        # key, and the end byte of the slice is the end of the data for 'foo@bar'
        self._parsed_key_map = []
        self._key_count = None
        self._keys_by_offset = None
        self._nodes_by_key = None
        self._size = size
        # The number of bytes we've read so far in trying to process this file
        self._bytes_read = 0

    def __eq__(self, other):
        """Equal when self and other were created with the same parameters."""
        return (
            type(self) == type(other) and
            self._transport == other._transport and
            self._name == other._name and
            self._size == other._size)

    def __ne__(self, other):
        return not self.__eq__(other)

    def __repr__(self):
        return "%s(%r)" % (self.__class__.__name__,
            self._transport.abspath(self._name))

    def _buffer_all(self, stream=None):
        """Buffer all the index data.

        Mutates self._nodes and self.keys_by_offset.
        """
        if self._nodes is not None:
            # We already did this
            return
        if 'index' in debug.debug_flags:
            mutter('Reading entire index %s', self._transport.abspath(self._name))
        if stream is None:
            stream = self._transport.get(self._name)
        self._read_prefix(stream)
        self._expected_elements = 3 + self._key_length
        # raw data keyed by offset
        self._keys_by_offset = {}
        # ready-to-return key:value or key:value, node_ref_lists
        self._nodes = {}
        self._nodes_by_key = None
        trailers = 0
        pos = stream.tell()
        lines = stream.read().split('\n')
        del lines[-1]
        _, _, _, trailers = self._parse_lines(lines, pos)
        for key, absent, references, value in self._keys_by_offset.itervalues():
            if absent:
                continue
            # resolve references:
            if self.node_ref_lists:
                node_value = (value, self._resolve_references(references))
            else:
                node_value = value
            self._nodes[key] = node_value
        # cache the keys for quick set intersections
        self._keys = set(self._nodes)
        if trailers != 1:
            # there must be one line - the empty trailer line.
            raise errors.BadIndexData(self)

    def external_references(self, ref_list_num):
        """Return references that are not present in this index."""
        self._buffer_all()
        if ref_list_num + 1 > self.node_ref_lists:
            raise ValueError('No ref list %d, index has %d ref lists'
                % (ref_list_num, self.node_ref_lists))
        refs = set()
        for key, (value, ref_lists) in self._nodes.iteritems():
            ref_list = ref_lists[ref_list_num]
            refs.update(ref_list)
        return refs - self._keys

    def _get_nodes_by_key(self):
        if self._nodes_by_key is None:
            nodes_by_key = {}
            if self.node_ref_lists:
                for key, (value, references) in self._nodes.iteritems():
                    key_dict = nodes_by_key
                    for subkey in key[:-1]:
                        key_dict = key_dict.setdefault(subkey, {})
                    key_dict[key[-1]] = key, value, references
            else:
                for key, value in self._nodes.iteritems():
                    key_dict = nodes_by_key
                    for subkey in key[:-1]:
                        key_dict = key_dict.setdefault(subkey, {})
                    key_dict[key[-1]] = key, value
            self._nodes_by_key = nodes_by_key
        return self._nodes_by_key

    def iter_all_entries(self):
        """Iterate over all keys within the index.

        :return: An iterable of (index, key, value) or (index, key, value, reference_lists).
            The former tuple is used when there are no reference lists in the
            index, making the API compatible with simple key:value index types.
            There is no defined order for the result iteration - it will be in
            the most efficient order for the index.
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        if self._nodes is None:
            self._buffer_all()
        if self.node_ref_lists:
            for key, (value, node_ref_lists) in self._nodes.iteritems():
                yield self, key, value, node_ref_lists
        else:
            for key, value in self._nodes.iteritems():
                yield self, key, value

    def _read_prefix(self, stream):
        signature = stream.read(len(self._signature()))
        if not signature == self._signature():
            raise errors.BadIndexFormatSignature(self._name, GraphIndex)
        options_line = stream.readline()
        if not options_line.startswith(_OPTION_NODE_REFS):
            raise errors.BadIndexOptions(self)
        try:
            self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)
        options_line = stream.readline()
        if not options_line.startswith(_OPTION_KEY_ELEMENTS):
            raise errors.BadIndexOptions(self)
        try:
            self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)
        options_line = stream.readline()
        if not options_line.startswith(_OPTION_LEN):
            raise errors.BadIndexOptions(self)
        try:
            self._key_count = int(options_line[len(_OPTION_LEN):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)

    def _resolve_references(self, references):
        """Return the resolved key references for references.

        References are resolved by looking up the location of the key in the
        _keys_by_offset map and substituting the key name, preserving ordering.

        :param references: An iterable of iterables of key locations. e.g.
            [[123, 456], [123]]
        :return: A tuple of tuples of keys.
        """
        node_refs = []
        for ref_list in references:
            node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))
        return tuple(node_refs)

    def _find_index(self, range_map, key):
        """Helper for the _parsed_*_index calls.

        Given a range map - [(start, end), ...], finds the index of the range
        in the map for key if it is in the map, and if it is not there, the
        immediately preceding range in the map.
        """
        result = bisect_right(range_map, key) - 1
        if result + 1 < len(range_map):
            # check the border condition, it may be in result + 1
            if range_map[result + 1][0] == key[0]:
                return result + 1
        return result

    def _parsed_byte_index(self, offset):
        """Return the index of the entry immediately before offset.

        e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that
        there is one unparsed byte (the 11th, addressed as [10]). then:
        asking for 0 will return 0
        asking for 10 will return 0
        asking for 11 will return 1
        asking for 12 will return 1
        """
        key = (offset, 0)
        return self._find_index(self._parsed_byte_map, key)

    def _parsed_key_index(self, key):
        """Return the index of the entry immediately before key.

        e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,
        meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive
        have been parsed, then:
        asking for '' will return 0
        asking for 'a' will return 0
        asking for 'b' will return 1
        asking for 'e' will return 1
        """
        search_key = (key, None)
        return self._find_index(self._parsed_key_map, search_key)

    def _is_parsed(self, offset):
        """Returns True if offset has been parsed."""
        index = self._parsed_byte_index(offset)
        if index == len(self._parsed_byte_map):
            return offset < self._parsed_byte_map[index - 1][1]
        start, end = self._parsed_byte_map[index]
        return offset >= start and offset < end

    def _iter_entries_from_total_buffer(self, keys):
        """Iterate over keys when the entire index is parsed."""
        keys = keys.intersection(self._keys)
        if self.node_ref_lists:
            for key in keys:
                value, node_refs = self._nodes[key]
                yield self, key, value, node_refs
        else:
            for key in keys:
                yield self, key, self._nodes[key]

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys supplied. No additional keys will be returned, and every
            key supplied that is in the index will be returned.
        """
        keys = set(keys)
        if not keys:
            return []
        if self._size is None and self._nodes is None:
            self._buffer_all()

        # We fit about 20 keys per minimum-read (4K), so if we are looking for
        # more than 1/20th of the index it's likely (assuming homogenous key
        # spread) that we'll read the entire index. If we're going to do that,
        # buffer the whole thing. A better analysis might take key spread into
        # account - but B+Tree indices are better anyway.
        # We could look at all data read, and use a threshold there, which will
        # trigger on ancestry walks, but that is not yet fully mapped out.
        if self._nodes is None and len(keys) * 20 > self.key_count():
            self._buffer_all()
        if self._nodes is not None:
            return self._iter_entries_from_total_buffer(keys)
        else:
            return (result[1] for result in bisect_multi_bytes(
                self._lookup_keys_via_location, self._size, keys))
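
    # Rough numbers behind the heuristic above (illustrative, not from the
    # original source): at ~4K per minimum read and roughly 200 bytes per row,
    # each read returns about 20 rows, so asking for more than
    # key_count() / 20 keys tends to touch most of the file anyway, and one
    # up-front buffer of the whole index beats many bisection round trips.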

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        WARNING: Note that this method currently causes a full index parse
        unconditionally (which is reasonably appropriate as it is a means for
        thunking many small indices into one larger one and still supplies
        iter_all_entries at the thunk layer).

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        keys = set(keys)
        if not keys:
            return
        # load data - also finds key lengths
        if self._nodes is None:
            self._buffer_all()
        if self._key_length == 1:
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                if self.node_ref_lists:
                    value, node_refs = self._nodes[key]
                    yield self, key, value, node_refs
                else:
                    yield self, key, self._nodes[key]
            return
        nodes_by_key = self._get_nodes_by_key()
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = nodes_by_key
            elements = list(key)
            # find the subdict whose contents should be returned.
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements = elements[1:]
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    item, value = key_dict.iteritems().next()
                    if type(value) == dict:
                        # push keys
                        dicts.extend(key_dict.itervalues())
                    else:
                        # yield keys
                        for value in key_dict.itervalues():
                            # each value is the key:value:node refs tuple
                            # ready to yield.
                            yield (self, ) + value
            else:
                # the last thing looked up was a terminal element
                yield (self, ) + key_dict

    def _find_ancestors(self, keys, ref_list_num, parent_map, missing_keys):
        """See BTreeIndex._find_ancestors."""
        # The api can be implemented as a trivial overlay on top of
        # iter_entries, it is not an efficient implementation, but it at least
        # gets the job done.
        found_keys = set()
        search_keys = set()
        for index, key, value, refs in self.iter_entries(keys):
            parent_keys = refs[ref_list_num]
            found_keys.add(key)
            parent_map[key] = parent_keys
            search_keys.update(parent_keys)
        # Figure out what, if anything, was missing
        missing_keys.update(set(keys).difference(found_keys))
        search_keys = search_keys.difference(parent_map)
        return search_keys

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For GraphIndex the estimate is exact.
        """
        if self._key_count is None:
            self._read_and_parse([_HEADER_READV])
        return self._key_count

    def _lookup_keys_via_location(self, location_keys):
        """Public interface for implementing bisection.

        If _buffer_all has been called, then all the data for the index is in
        memory, and this method should not be called, as it uses a separate
        cache because it cannot pre-resolve all indices, which buffer_all does
        for performance.

        :param location_keys: A list of location(byte offset), key tuples.
        :return: A list of (location_key, result) tuples as expected by
            bzrlib.bisect_multi.bisect_multi_bytes.
        """
        # Possible improvements:
        #  - only bisect lookup each key once
        #  - sort the keys first, and use that to reduce the bisection window
        # -----
        # this progresses in three parts:
        # read data
        # parse it
        # attempt to answer the question from the now in memory data.
        # build the readv request
        # for each location, ask for 800 bytes - much more than rows we've seen
        # anywhere.
        readv_ranges = []
        for location, key in location_keys:
            # can we answer from cache?
            if self._bisect_nodes and key in self._bisect_nodes:
                # We have the key parsed.
                continue
            index = self._parsed_key_index(key)
            if (len(self._parsed_key_map) and
                self._parsed_key_map[index][0] <= key and
                (self._parsed_key_map[index][1] >= key or
                 # end of the file has been parsed
                 self._parsed_byte_map[index][1] == self._size)):
                # the key has been parsed, so no lookup is needed even if it's
                # not present.
                continue
            # - if we have examined this part of the file already - yes
            index = self._parsed_byte_index(location)
            if (len(self._parsed_byte_map) and
                self._parsed_byte_map[index][0] <= location and
                self._parsed_byte_map[index][1] > location):
                # the byte region has been parsed, so no read is needed.
                continue
            length = 800
            if location + length > self._size:
                length = self._size - location
            # todo, trim out parsed locations.
            if length > 0:
                readv_ranges.append((location, length))
        # read the header if needed
        if self._bisect_nodes is None:
            readv_ranges.append(_HEADER_READV)
        self._read_and_parse(readv_ranges)
        result = []
        if self._nodes is not None:
            # _read_and_parse triggered a _buffer_all because we requested the
            # whole data range
            for location, key in location_keys:
                if key not in self._nodes: # not present
                    result.append(((location, key), False))
                elif self.node_ref_lists:
                    value, refs = self._nodes[key]
                    result.append(((location, key),
                        (self, key, value, refs)))
                else:
                    result.append(((location, key),
                        (self, key, self._nodes[key])))
            return result
        # generate results:
        #  - figure out <, >, missing, present
        #  - result present references so we can return them.
        # keys that we cannot answer until we resolve references
        pending_references = []
        pending_locations = set()
        for location, key in location_keys:
            # can we answer from cache?
            if key in self._bisect_nodes:
                # the key has been parsed, so no lookup is needed
                if self.node_ref_lists:
                    # the references may not have been all parsed.
                    value, refs = self._bisect_nodes[key]
                    wanted_locations = []
                    for ref_list in refs:
                        for ref in ref_list:
                            if ref not in self._keys_by_offset:
                                wanted_locations.append(ref)
                    if wanted_locations:
                        pending_locations.update(wanted_locations)
                        pending_references.append((location, key))
                        continue
                    result.append(((location, key), (self, key,
                        value, self._resolve_references(refs))))
                else:
                    result.append(((location, key),
                        (self, key, self._bisect_nodes[key])))
                continue
            else:
                # has the region the key should be in, been parsed?
                index = self._parsed_key_index(key)
                if (self._parsed_key_map[index][0] <= key and
                    (self._parsed_key_map[index][1] >= key or
                     # end of the file has been parsed
                     self._parsed_byte_map[index][1] == self._size)):
                    result.append(((location, key), False))
                    continue
            # no, is the key above or below the probed location:
            # get the range of the probed & parsed location
            index = self._parsed_byte_index(location)
            # if the key is below the start of the range, its below
            if key < self._parsed_key_map[index][0]:
                direction = -1
            else:
                direction = +1
            result.append(((location, key), direction))
        readv_ranges = []
        # lookup data to resolve references
        for location in pending_locations:
            length = 800
            if location + length > self._size:
                length = self._size - location
            # TODO: trim out parsed locations (e.g. if the 800 is into the
            # parsed region trim it, and don't use the adjust_for_latency
            # facility)
            if length > 0:
                readv_ranges.append((location, length))
        self._read_and_parse(readv_ranges)
        if self._nodes is not None:
            # The _read_and_parse triggered a _buffer_all, grab the data and
            # return it
            for location, key in pending_references:
                value, refs = self._nodes[key]
                result.append(((location, key), (self, key, value, refs)))
            return result
        for location, key in pending_references:
            # answer key references we had to look-up-late.
            value, refs = self._bisect_nodes[key]
            result.append(((location, key), (self, key,
                value, self._resolve_references(refs))))
        return result
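
    # Sketch of the bisection contract (illustrative, not from the original
    # source): bzrlib.bisect_multi.bisect_multi_bytes repeatedly guesses byte
    # offsets for each outstanding key and calls back into this method:
    #
    #   for location_key, answer in index._lookup_keys_via_location(
    #           [(5000, ('some-key',))]):
    #       # answer is False (a parsed region proves absence), a hit tuple
    #       # (index, key, value[, refs]), or -1/+1 telling the bisector to
    #       # probe lower or higher.
    #
    # Each call also parses the regions it had to read, so later probes can
    # answer more questions straight from cache.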

    def _parse_header_from_bytes(self, bytes):
        """Parse the header from a region of bytes.

        :param bytes: The data to parse.
        :return: An offset, data tuple such as readv yields, for the unparsed
            data. (which may be of length 0).
        """
        signature = bytes[0:len(self._signature())]
        if not signature == self._signature():
            raise errors.BadIndexFormatSignature(self._name, GraphIndex)
        lines = bytes[len(self._signature()):].splitlines()
        options_line = lines[0]
        if not options_line.startswith(_OPTION_NODE_REFS):
            raise errors.BadIndexOptions(self)
        try:
            self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        options_line = lines[1]
        if not options_line.startswith(_OPTION_KEY_ELEMENTS):
            raise errors.BadIndexOptions(self)
        try:
            self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        options_line = lines[2]
        if not options_line.startswith(_OPTION_LEN):
            raise errors.BadIndexOptions(self)
        try:
            self._key_count = int(options_line[len(_OPTION_LEN):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        # calculate the bytes we have processed
        header_end = (len(signature) + len(lines[0]) + len(lines[1]) +
            len(lines[2]) + 3)
        self._parsed_bytes(0, None, header_end, None)
        # setup parsing state
        self._expected_elements = 3 + self._key_length
        # raw data keyed by offset
        self._keys_by_offset = {}
        # keys with the value and node references
        self._bisect_nodes = {}
        return header_end, bytes[header_end:]

    def _parse_region(self, offset, data):
        """Parse node data returned from a readv operation.

        :param offset: The byte offset the data starts at.
        :param data: The data to parse.
        """
        # trim the data.
        # end first:
        end = offset + len(data)
        high_parsed = offset
        while True:
            # Trivial test - if the current index's end is within the
            # low-matching parsed range, we're done.
            index = self._parsed_byte_index(high_parsed)
            if end < self._parsed_byte_map[index][1]:
                return
            # print "[%d:%d]" % (offset, end), \
            #     self._parsed_byte_map[index:index + 2]
            high_parsed, last_segment = self._parse_segment(
                offset, data, end, index)
            if last_segment:
                return

    def _parse_segment(self, offset, data, end, index):
        """Parse one segment of data.

        :param offset: Where 'data' begins in the file.
        :param data: Some data to parse a segment of.
        :param end: Where data ends
        :param index: The current index into the parsed bytes map.
        :return: True if the parsed segment is the last possible one in the
            range of data.
        :return: high_parsed_byte, last_segment.
            high_parsed_byte is the location of the highest parsed byte in this
            segment, last_segment is True if the parsed segment is the last
            possible one in the data block.
        """
        # default is to use all data
        trim_end = None
        # accommodate overlap with data before this.
        if offset < self._parsed_byte_map[index][1]:
            # overlaps the lower parsed region
            # skip the parsed data
            trim_start = self._parsed_byte_map[index][1] - offset
            # don't trim the start for \n
            start_adjacent = True
        elif offset == self._parsed_byte_map[index][1]:
            # abuts the lower parsed region
            # use all data
            trim_start = None
            # do not trim anything
            start_adjacent = True
        else:
            # does not overlap the lower parsed region
            # use all data
            trim_start = None
            # but trim the leading \n
            start_adjacent = False
        if end == self._size:
            # lines up to the end of all data:
            # use it all
            trim_end = None
            # do not strip to the last \n
            end_adjacent = True
            last_segment = True
        elif index + 1 == len(self._parsed_byte_map):
            # at the end of the parsed data
            # use it all
            trim_end = None
            # but strip to the last \n
            end_adjacent = False
            last_segment = True
        elif end == self._parsed_byte_map[index + 1][0]:
            # buts up against the next parsed region
            # use it all
            trim_end = None
            # do not strip to the last \n
            end_adjacent = True
            last_segment = True
        elif end > self._parsed_byte_map[index + 1][0]:
            # overlaps into the next parsed region
            # only consider the unparsed data
            trim_end = self._parsed_byte_map[index + 1][0] - offset
            # do not strip to the last \n as we know it's an entire record
            end_adjacent = True
            last_segment = end < self._parsed_byte_map[index + 1][1]
        else:
            # does not overlap into the next region
            # use it all
            trim_end = None
            # but strip to the last \n
            end_adjacent = False
            last_segment = True
        # now find bytes to discard if needed
        if not start_adjacent:
            # work around python bug in rfind
            if trim_start is None:
                trim_start = data.find('\n') + 1
            else:
                trim_start = data.find('\n', trim_start) + 1
            if not (trim_start != 0):
                raise AssertionError('no \n was present')
            # print 'removing start', offset, trim_start, repr(data[:trim_start])
        if not end_adjacent:
            # work around python bug in rfind
            if trim_end is None:
                trim_end = data.rfind('\n') + 1
            else:
                trim_end = data.rfind('\n', None, trim_end) + 1
            if not (trim_end != 0):
                raise AssertionError('no \n was present')
            # print 'removing end', offset, trim_end, repr(data[trim_end:])
        # adjust offset and data to the parseable data.
        trimmed_data = data[trim_start:trim_end]
        if not (trimmed_data):
            raise AssertionError('read unneeded data [%d:%d] from [%d:%d]'
                % (trim_start, trim_end, offset, offset + len(data)))
        if trim_start:
            offset += trim_start
        # print "parsing", repr(trimmed_data)
        # splitlines mangles the \r delimiters.. don't use it.
        lines = trimmed_data.split('\n')
        del lines[-1]
        pos = offset
        first_key, last_key, nodes, _ = self._parse_lines(lines, pos)
        for key, value in nodes:
            self._bisect_nodes[key] = value
        self._parsed_bytes(offset, first_key,
            offset + len(trimmed_data), last_key)
        return offset + len(trimmed_data), last_segment
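
    # Illustrative example of the trimming above (not from the original
    # source): if an 800-byte read lands mid-record at both ends and touches
    # no parsed region, the bytes before the first '\n' and after the last
    # '\n' are discarded, since partial rows cannot be parsed; the
    # adjacent-region checks exist so that complete records abutting
    # already-parsed data are not thrown away.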

    def _parse_lines(self, lines, pos):
        key = None
        first_key = None
        trailers = 0
        nodes = []
        for line in lines:
            if line == '':
                # must be at the end
                if self._size:
                    if not (self._size == pos + 1):
                        raise AssertionError("%s %s" % (self._size, pos))
                trailers += 1
                continue
            elements = line.split('\0')
            if len(elements) != self._expected_elements:
                raise errors.BadIndexData(self)
            # keys are tuples. Each element is a string that may occur many
            # times, so we intern them to save space. AB, RC, 200807
            key = tuple([intern(element) for element in elements[:self._key_length]])
            if first_key is None:
                first_key = key
            absent, references, value = elements[-3:]
            ref_lists = []
            for ref_string in references.split('\t'):
                ref_lists.append(tuple([
                    int(ref) for ref in ref_string.split('\r') if ref
                    ]))
            ref_lists = tuple(ref_lists)
            self._keys_by_offset[pos] = (key, absent, ref_lists, value)
            pos += len(line) + 1 # +1 for the \n
            if absent:
                continue
            if self.node_ref_lists:
                node_value = (value, ref_lists)
            else:
                node_value = value
            nodes.append((key, node_value))
            # print "parsed ", key
        return first_key, key, nodes, trailers

    def _parsed_bytes(self, start, start_key, end, end_key):
        """Mark the bytes from start to end as parsed.

        Calling self._parsed_bytes(1,2) will mark one byte (the one at offset
        1) as parsed.

        :param start: The start of the parsed region.
        :param end: The end of the parsed region.
        """
        index = self._parsed_byte_index(start)
        new_value = (start, end)
        new_key = (start_key, end_key)
        if index == -1:
            # first range parsed is always the beginning.
            self._parsed_byte_map.insert(index, new_value)
            self._parsed_key_map.insert(index, new_key)
            return
        # four cases:
        # new region
        # extend lower region
        # extend higher region
        # combine two regions
        if (index + 1 < len(self._parsed_byte_map) and
            self._parsed_byte_map[index][1] == start and
            self._parsed_byte_map[index + 1][0] == end):
            # combine two regions
            self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],
                self._parsed_byte_map[index + 1][1])
            self._parsed_key_map[index] = (self._parsed_key_map[index][0],
                self._parsed_key_map[index + 1][1])
            del self._parsed_byte_map[index + 1]
            del self._parsed_key_map[index + 1]
        elif self._parsed_byte_map[index][1] == start:
            # extend the lower entry
            self._parsed_byte_map[index] = (
                self._parsed_byte_map[index][0], end)
            self._parsed_key_map[index] = (
                self._parsed_key_map[index][0], end_key)
        elif (index + 1 < len(self._parsed_byte_map) and
            self._parsed_byte_map[index + 1][0] == end):
            # extend the higher entry
            self._parsed_byte_map[index + 1] = (
                start, self._parsed_byte_map[index + 1][1])
            self._parsed_key_map[index + 1] = (
                start_key, self._parsed_key_map[index + 1][1])
        else:
            # new entry
            self._parsed_byte_map.insert(index + 1, new_value)
            self._parsed_key_map.insert(index + 1, new_key)
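
    # Worked example (illustrative, not from the original source): with
    # _parsed_byte_map == [(0, 100), (200, 300)], marking (100, 200) as parsed
    # takes the "combine two regions" branch, collapsing the map to
    # [(0, 300)]; marking (300, 400) instead extends the lower entry, giving
    # [(0, 100), (200, 400)].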

    def _read_and_parse(self, readv_ranges):
        """Read the ranges and parse the resulting data.

        :param readv_ranges: A prepared readv range list.
        """
        if not readv_ranges:
            return
        if self._nodes is None and self._bytes_read * 2 >= self._size:
            # We've already read more than 50% of the file and we are about to
            # request more data, just _buffer_all() and be done
            self._buffer_all()
            return

        readv_data = self._transport.readv(self._name, readv_ranges, True,
            self._size)
        # parse
        for offset, data in readv_data:
            self._bytes_read += len(data)
            if offset == 0 and len(data) == self._size:
                # We read the whole range, most likely because the
                # Transport upcast our readv ranges into one long request
                # for enough total data to grab the whole index.
                self._buffer_all(StringIO(data))
                return
            if self._bisect_nodes is None:
                # this must be the start
                if not (offset == 0):
                    raise AssertionError()
                offset, data = self._parse_header_from_bytes(data)
            # print readv_ranges, "[%d:%d]" % (offset, offset + len(data))
            self._parse_region(offset, data)

    def _signature(self):
        """The file signature for this index type."""
        return _SIGNATURE

    def validate(self):
        """Validate that everything in the index can be accessed."""
        # iter_all validates completely at the moment, so just do that.
        for node in self.iter_all_entries():
            pass


class CombinedGraphIndex(object):
    """A GraphIndex made up from smaller GraphIndices.

    The backing indices must implement GraphIndex, and are presumed to be
    static data.

    Queries against the combined index will be made against the first index,
    and then the second and so on. The order of indices can thus influence
    performance significantly. For example, if one index is on local disk and a
    second on a remote server, the local disk index should be before the other
    in the index list.
    """

    def __init__(self, indices, reload_func=None):
        """Create a CombinedGraphIndex backed by indices.

        :param indices: An ordered list of indices to query for data.
        :param reload_func: A function to call if we find we are missing an
            index. Should have the form reload_func() => True/False to indicate
            if reloading actually changed anything.
        """
        self._indices = indices
        self._reload_func = reload_func

    def __repr__(self):
        return "%s(%s)" % (
                self.__class__.__name__,
                ', '.join(map(repr, self._indices)))

    def get_parent_map(self, keys):
        """See graph.StackedParentsProvider.get_parent_map"""
        search_keys = set(keys)
        if NULL_REVISION in search_keys:
            search_keys.discard(NULL_REVISION)
            found_parents = {NULL_REVISION:[]}
        else:
            found_parents = {}
        for index, key, value, refs in self.iter_entries(search_keys):
            parents = refs[0]
            if not parents:
                parents = (NULL_REVISION,)
            found_parents[key] = parents
        return found_parents

    has_key = _has_key_from_parent_map

    def insert_index(self, pos, index):
        """Insert a new index in the list of indices to query.

        :param pos: The position to insert the index.
        :param index: The index to insert.
        """
        self._indices.insert(pos, index)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        :return: An iterable of (index, key, reference_lists, value).
            There is no defined order for the result iteration - it will be in
            the most efficient order for the index.
        """
        seen_keys = set()
        while True:
            try:
                for index in self._indices:
                    for node in index.iter_all_entries():
                        if node[1] not in seen_keys:
                            yield node
                            seen_keys.add(node[1])
                return
            except errors.NoSuchFile:
                self._reload_or_raise()

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, reference_lists, value). There is no
            defined order for the result iteration - it will be in the most
            efficient order for the index.
        """
        keys = set(keys)
        while True:
            try:
                for index in self._indices:
                    if not keys:
                        return
                    for node in index.iter_entries(keys):
                        keys.remove(node[1])
                        yield node
                return
            except errors.NoSuchFile:
                self._reload_or_raise()

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        keys = set(keys)
        if not keys:
            return
        seen_keys = set()
        while True:
            try:
                for index in self._indices:
                    for node in index.iter_entries_prefix(keys):
                        if node[1] in seen_keys:
                            continue
                        seen_keys.add(node[1])
                        yield node
                return
            except errors.NoSuchFile:
                self._reload_or_raise()

    def find_ancestry(self, keys, ref_list_num):
        """Find the complete ancestry for the given set of keys.

        Note that this is a whole-ancestry request, so it should be used
        sparingly.

        :param keys: An iterable of keys to look for
        :param ref_list_num: The reference list which references the parents
            we care about.
        :return: (parent_map, missing_keys)
        """
        missing_keys = set()
        parent_map = {}
        keys_to_lookup = set(keys)
        generation = 0
        while keys_to_lookup:
            # keys that *all* indexes claim are missing, stop searching them
            generation += 1
            all_index_missing = None
            # print 'gen\tidx\tsub\tn_keys\tn_pmap\tn_miss'
            # print '%4d\t\t\t%4d\t%5d\t%5d' % (generation, len(keys_to_lookup),
            #                                   len(parent_map),
            #                                   len(missing_keys))
            for index_idx, index in enumerate(self._indices):
                # TODO: we should probably be doing something with
                #       'missing_keys' since we've already determined that
                #       those revisions have not been found anywhere
                index_missing_keys = set()
                # Find all of the ancestry we can from this index
                # keep looking until the search_keys set is empty, which means
                # things we didn't find should be in index_missing_keys
                search_keys = keys_to_lookup
                sub_generation = 0
                # print '    \t%2d\t\t%4d\t%5d\t%5d' % (
                #     index_idx, len(search_keys),
                #     len(parent_map), len(index_missing_keys))
                while search_keys:
                    sub_generation += 1
                    # TODO: ref_list_num should really be a parameter, since
                    #       CombinedGraphIndex does not know what the ref lists
                    #       mean.
                    search_keys = index._find_ancestors(search_keys,
                        ref_list_num, parent_map, index_missing_keys)
                    # print '    \t  \t%2d\t%4d\t%5d\t%5d' % (
                    #     sub_generation, len(search_keys),
                    #     len(parent_map), len(index_missing_keys))
                # Now set whatever was missing to be searched in the next index
                keys_to_lookup = index_missing_keys
                if all_index_missing is None:
                    all_index_missing = set(index_missing_keys)
                else:
                    all_index_missing.intersection_update(index_missing_keys)
                if not keys_to_lookup:
                    break
            if all_index_missing is None:
                # There were no indexes, so all search keys are 'missing'
                missing_keys.update(keys_to_lookup)
                keys_to_lookup = None
            else:
                missing_keys.update(all_index_missing)
                keys_to_lookup.difference_update(all_index_missing)
        return parent_map, missing_keys

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For CombinedGraphIndex this is approximated by the sum of the keys of
        the child indices. As child indices may have duplicate keys this can
        have a maximum error of the number of child indices * largest number of
        duplicated keys.
        """
        while True:
            try:
                return sum((index.key_count() for index in self._indices), 0)
            except errors.NoSuchFile:
                self._reload_or_raise()

    missing_keys = _missing_keys_from_parent_map

    def _reload_or_raise(self):
        """We just got a NoSuchFile exception.

        Try to reload the indices, if it fails, just raise the current
        exception.
        """
        if self._reload_func is None:
            raise
        exc_type, exc_value, exc_traceback = sys.exc_info()
        trace.mutter('Trying to reload after getting exception: %s',
                     exc_value)
        if not self._reload_func():
            # We tried to reload, but nothing changed, so we fail anyway
            trace.mutter('_reload_func indicated nothing has changed.'
                         ' Raising original exception.')
            raise exc_type, exc_value, exc_traceback

    def validate(self):
        """Validate that everything in the index can be accessed."""
        while True:
            try:
                for index in self._indices:
                    index.validate()
                return
            except errors.NoSuchFile:
                self._reload_or_raise()


class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during a
    single write operation, where the accumulated entries need to be immediately
    available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, node_refs, value) entries to add.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        :return: An iterable of (index, key, reference_lists, value). There is no
            defined order for the result iteration - it will be in the most
            efficient order for the index (in this case dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        if self.reference_lists:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value, references
        else:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists). There is no
            defined order for the result iteration - it will be in the most
            efficient order for the index (keys iteration order in this case).
        """
        keys = set(keys)
        if self.reference_lists:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2], node[1]
        else:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        # XXX: Too much duplication with the GraphIndex class; consider finding
        # a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        if self._key_length == 1:
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                node = self._nodes[key]
                if node[0]:
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
            return
        nodes_by_key = self._get_nodes_by_key()
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = nodes_by_key
            elements = list(key)
            # find the subdict to return
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements = elements[1:]
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    item, value = key_dict.iteritems().next()
                    if type(value) == dict:
                        # push keys
                        dicts.extend(key_dict.itervalues())
                    else:
                        # yield keys
                        for value in key_dict.itervalues():
                            yield (self, ) + value
            else:
                yield (self, ) + key_dict

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory indexes have no known corruption at the moment."""


class GraphIndexPrefixAdapter(object):
    """An adapter between GraphIndex with different key lengths.

    Queries against this will emit queries against the adapted Graph with the
    prefix added, queries for all items use iter_entries_prefix. The returned
    nodes will have their keys and node references adjusted to remove the
    prefix. Finally, an add_nodes_callback can be supplied - when called the
    nodes and references being added will have prefix prepended.
    """

    def __init__(self, adapted, prefix, missing_key_length,
        add_nodes_callback=None):
        """Construct an adapter against adapted with prefix."""
        self.adapted = adapted
        self.prefix_key = prefix + (None,)*missing_key_length
        self.prefix = prefix
        self.prefix_len = len(prefix)
        self.add_nodes_callback = add_nodes_callback

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, node_refs, value) entries to add.
        """
        # save nodes in case it's an iterator
        nodes = tuple(nodes)
        translated_nodes = []
        try:
            # Add prefix_key to each reference; node_refs is a tuple of tuples,
            # so split it apart, and add prefix_key to the internal reference
            for (key, value, node_refs) in nodes:
                adjusted_references = (
                    tuple(tuple(self.prefix + ref_node for ref_node in ref_list)
                        for ref_list in node_refs))
                translated_nodes.append((self.prefix + key, value,
                    adjusted_references))
        except ValueError:
            # XXX: TODO add an explicit interface for getting the reference list
            # status, to handle this bit of user-friendliness in the API more
            # explicitly.
            for (key, value) in nodes:
                translated_nodes.append((self.prefix + key, value))
        self.add_nodes_callback(translated_nodes)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \0 or \n.
        """
        self.add_nodes(((key, value, references), ))

    def _strip_prefix(self, an_iter):
        """Strip prefix data from nodes and return it."""
        for node in an_iter:
            # cross checks
            if node[1][:self.prefix_len] != self.prefix:
                raise errors.BadIndexData(self)
            for ref_list in node[3]:
                for ref_node in ref_list:
                    if ref_node[:self.prefix_len] != self.prefix:
                        raise errors.BadIndexData(self)
            yield node[0], node[1][self.prefix_len:], node[2], (
                tuple(tuple(ref_node[self.prefix_len:] for ref_node in ref_list)
                for ref_list in node[3]))

    def iter_all_entries(self):
        """Iterate over all keys within the index

        iter_all_entries is implemented against the adapted index using
        iter_entries_prefix.

        :return: An iterable of (index, key, reference_lists, value). There is no
            defined order for the result iteration - it will be in the most
            efficient order for the index (in this case dictionary hash order).
        """
        return self._strip_prefix(self.adapted.iter_entries_prefix([self.prefix_key]))

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists). There is no
            defined order for the result iteration - it will be in the most
            efficient order for the index (keys iteration order in this case).
        """
        return self._strip_prefix(self.adapted.iter_entries(
            self.prefix + key for key in keys))

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        return self._strip_prefix(self.adapted.iter_entries_prefix(
            self.prefix + key for key in keys))

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For GraphIndexPrefixAdapter this is relatively expensive - key
        iteration with the prefix is done.
        """
        return len(list(self.iter_all_entries()))

    def validate(self):
        """Call the adapted's validate."""
        self.adapted.validate()
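

# A usage sketch for the adapter (illustrative, not from the original source):
# wrapping a key_elements=2 index so callers can work with 1-element keys:
#
#   builder = InMemoryGraphIndex(reference_lists=1, key_elements=2)
#   adapter = GraphIndexPrefixAdapter(
#       builder, ('file-id',), 1, add_nodes_callback=builder.add_nodes)
#   adapter.add_node(('rev-1',), 'value', ([],))
#   # stored in builder as (('file-id', 'rev-1'), 'value', ((),))
#   entries = list(adapter.iter_all_entries())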