/brz/remove-bazaar : revision 4679.8.8

To get this branch, use:

bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/btree_index.py

Committer: John Arbash Meinel
Date: 2009-10-12 22:04:23 UTC
mto: This revision was merged to the branch mainline in revision 4749.
Revision ID: john@arbash-meinel.com-20091012220423-zhf08uf178gwqwog

I think I know where things are going wrong, at least with tuple concatenation.

However, I can't reproduce any of the 800+ test failures seen on PQM here (yet).

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_import_c_api.h

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/doc_generate/sphinx_conf.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/static_tuple.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/script.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_script.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/pathfilter.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/Bazaar-Logo-For-Manuals.png

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/conf.py

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/implementation-notes.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index-plain.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/miscellaneous-notes.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/process.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/specifications.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_static/en/Makefile

doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/_static/en/bzr-en-quick-reference.png

doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/Makefile

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/index.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/index.txt

doc/es/user-guide

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/news-template.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/convertfile.py

tools/convertinv.py

tools/generate_docs.py

tools/generate_release_notes.py

tools/history2revfiles.py

tools/http_client.py

tools/package_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-control.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

dir.py

dulwich

dulwich/.bzrignore

dulwich/COPYING

dulwich/Makefile

dulwich/README

dulwich/bin

dulwich/bin/dul-daemon

dulwich/bin/dul-receive-pack

dulwich/bin/dul-upload-pack

dulwich/bin/dulwich

dulwich/docs

dulwich/docs/protocol.txt

dulwich/dulwich

dulwich/dulwich/__init__.py

dulwich/dulwich/client.py

dulwich/dulwich/commit.py

dulwich/dulwich/errors.py

dulwich/dulwich/objects.py

dulwich/dulwich/pack.py

dulwich/dulwich/protocol.py

dulwich/dulwich/repo.py

dulwich/dulwich/server.py

dulwich/dulwich/tests

dulwich/dulwich/tests/__init__.py

dulwich/dulwich/tests/data

dulwich/dulwich/tests/data/blobs

dulwich/dulwich/tests/data/blobs/6f670c0fb53f9463760b7295fbb814e965fb20c8

dulwich/dulwich/tests/data/blobs/954a536f7819d40e6f637f849ee187dd10066349

dulwich/dulwich/tests/data/blobs/e69de29bb2d1d6434b8b29ae775ad8c2e48c5391

dulwich/dulwich/tests/data/commits

dulwich/dulwich/tests/data/commits/0d89f20333fbb1d2f3a94da77f4981373d8f4310

dulwich/dulwich/tests/data/commits/5dac377bdded4c9aeb8dff595f0faeebcc8498cc

dulwich/dulwich/tests/data/commits/60dacdc733de308bb77bb76ce0fb0f9b44c9769e

dulwich/dulwich/tests/data/packs

dulwich/dulwich/tests/data/packs/pack-bc63ddad95e7321ee734ea11a7a62d314e0d7481.idx

dulwich/dulwich/tests/data/packs/pack-bc63ddad95e7321ee734ea11a7a62d314e0d7481.pack

dulwich/dulwich/tests/data/repos

dulwich/dulwich/tests/data/repos/a

dulwich/dulwich/tests/data/repos/a/.git

dulwich/dulwich/tests/data/repos/a/.git/HEAD

dulwich/dulwich/tests/data/repos/a/.git/index

dulwich/dulwich/tests/data/repos/a/.git/objects

dulwich/dulwich/tests/data/repos/a/.git/objects/2a

dulwich/dulwich/tests/data/repos/a/.git/objects/2a/72d929692c41d8554c07f6301757ba18a65d91

dulwich/dulwich/tests/data/repos/a/.git/objects/4e

dulwich/dulwich/tests/data/repos/a/.git/objects/4e/f30bbfe26431a69c3820d3a683df54d688f2ec

dulwich/dulwich/tests/data/repos/a/.git/objects/4f

dulwich/dulwich/tests/data/repos/a/.git/objects/4f/2e6529203aa6d44b5af6e3292c837ceda003f9

dulwich/dulwich/tests/data/repos/a/.git/objects/7d

dulwich/dulwich/tests/data/repos/a/.git/objects/7d/9a07d797595ef11344549b8d08198e48c15364

dulwich/dulwich/tests/data/repos/a/.git/objects/a2

dulwich/dulwich/tests/data/repos/a/.git/objects/a2/96d0bb611188cabb256919f36bc30117cca005

dulwich/dulwich/tests/data/repos/a/.git/objects/a9

dulwich/dulwich/tests/data/repos/a/.git/objects/a9/0fa2d900a17e99b433217e988c4eb4a2e9a097

dulwich/dulwich/tests/data/repos/a/.git/objects/ff

dulwich/dulwich/tests/data/repos/a/.git/objects/ff/d47d45845a8f6576491e1edb97e3fe6a850e7f

dulwich/dulwich/tests/data/repos/a/.git/objects/info

dulwich/dulwich/tests/data/repos/a/.git/objects/pack

dulwich/dulwich/tests/data/repos/a/.git/refs

dulwich/dulwich/tests/data/repos/a/.git/refs/heads

dulwich/dulwich/tests/data/repos/a/.git/refs/heads/master

dulwich/dulwich/tests/data/repos/a/.git/refs/tags

dulwich/dulwich/tests/data/repos/a/a

dulwich/dulwich/tests/data/repos/a/b

dulwich/dulwich/tests/data/repos/a/c

dulwich/dulwich/tests/data/repos/ooo_merge

dulwich/dulwich/tests/data/repos/ooo_merge/.git

dulwich/dulwich/tests/data/repos/ooo_merge/.git/HEAD

dulwich/dulwich/tests/data/repos/ooo_merge/.git/index

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/29

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/29/69be3e8ee1c0222396a5611407e4769f14e54b

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/38

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/38/74e9c60a6d149c44c928140f250d81e6381520

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/6f

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/6f/670c0fb53f9463760b7295fbb814e965fb20c8

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/70

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/70/c190eb48fa8bbb50ddc692a17b44cb781af7f6

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/76

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/76/01d7f6231db6a57f7bbb79ee52e4d462fd44d1

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/90

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/90/182552c4a85a45ec2a835cadc3451bebdfe870

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/95

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/95/4a536f7819d40e6f637f849ee187dd10066349

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/b2

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/b2/a2766a2879c209ab1176e7e778b81ae422eeaa

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f5

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f5/07291b64138b875c28e03469025b1ea20bc614

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f9

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f9/e39b120c68182a4ba35349f832d0e4e61f485c

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/fb

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/fb/5b0425c7ce46959bec94d54b9a157645e114f5

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/info

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/pack

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs/heads

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs/heads/master

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs/tags

dulwich/dulwich/tests/data/repos/ooo_merge/a

dulwich/dulwich/tests/data/repos/ooo_merge/b

dulwich/dulwich/tests/data/repos/ooo_merge/c

dulwich/dulwich/tests/data/repos/simple_merge

dulwich/dulwich/tests/data/repos/simple_merge/.git

dulwich/dulwich/tests/data/repos/simple_merge/.git/HEAD

dulwich/dulwich/tests/data/repos/simple_merge/.git/index

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/0d

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/0d/89f20333fbb1d2f3a94da77f4981373d8f4310

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/1b

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/1b/6318f651a534b38f9c7aedeebbd56c1e896853

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/29

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/29/69be3e8ee1c0222396a5611407e4769f14e54b

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/4c

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/4c/ffe90e0a41ad3f5190079d7c8f036bde29cbe6

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/5d

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/5d/ac377bdded4c9aeb8dff595f0faeebcc8498cc

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/60

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/60/dacdc733de308bb77bb76ce0fb0f9b44c9769e

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/6f

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/6f/670c0fb53f9463760b7295fbb814e965fb20c8

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/70

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/70/c190eb48fa8bbb50ddc692a17b44cb781af7f6

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/90

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/90/182552c4a85a45ec2a835cadc3451bebdfe870

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/95

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/95/4a536f7819d40e6f637f849ee187dd10066349

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/ab

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/ab/64bbdcc51b170d21588e5c5d391ee5c0c96dfd

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d4

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d4/bdad6549dfedf25d3b89d21f506aff575b28a7

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d8

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d8/0c186a03f423a81b39df39dc87fd269736ca86

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/e6

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/e6/9de29bb2d1d6434b8b29ae775ad8c2e48c5391

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/info

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/pack

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs/heads

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs/heads/master

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs/tags

dulwich/dulwich/tests/data/repos/simple_merge/a

dulwich/dulwich/tests/data/repos/simple_merge/b

dulwich/dulwich/tests/data/repos/simple_merge/d

dulwich/dulwich/tests/data/repos/simple_merge/e

dulwich/dulwich/tests/data/trees

dulwich/dulwich/tests/data/trees/70c190eb48fa8bbb50ddc692a17b44cb781af7f6

dulwich/dulwich/tests/test_objects.py

dulwich/dulwich/tests/test_pack.py

dulwich/dulwich/tests/test_repository.py

dulwich/setup.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

remote.py

repository.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_ids.py

tests/test_repository.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/btree_index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""B+Tree indices"""

import cStringIO

from bisect import bisect_right

import math

import tempfile

import zlib

from bzrlib import (

chunk_writer,

debug,

errors,

fifo_cache,

index,

lru_cache,

osutils,

trace,

)

from bzrlib.index import _OPTION_NODE_REFS, _OPTION_KEY_ELEMENTS, _OPTION_LEN

from bzrlib.transport import get_transport

# First line of the header written by BTreeBuilder._write_nodes.
_BTSIGNATURE = "B+Tree Graph Index 2\n"

# Header option prefix; followed by the comma separated node count of each row.
_OPTION_ROW_LENGTHS = "row_lengths="

# First line written into every leaf node.
_LEAF_FLAG = "type=leaf\n"

# First line written into every internal node.
_INTERNAL_FLAG = "type=internal\n"

# Prefix of the second line of an internal node; followed by a node count.
_INTERNAL_OFFSET = "offset="

# Bytes kept free at the start of the first node of each row for the header.
_RESERVED_HEADER_BYTES = 120

# Size in bytes that the spooled node data is aligned to.
_PAGE_SIZE = 4096

# 4K per page: 4MB - 1000 entries

_NODE_CACHE_SIZE = 1000

class _BuilderRow(object):
    """State gathered while one row of the index tree is being written.

    :ivar spool: File-like object the finished nodes of this row are
        appended to; None until the first node has been finished.
    :ivar nodes: The number of nodes finished so far for this row.
    :ivar writer: The writer of the node currently being filled, or None
        when no node is open.
    """

    def __init__(self):
        """Create an empty row: no nodes, no spool, no open writer."""
        self.nodes = 0
        self.spool = None
        self.writer = None

    def finish_node(self, pad=True):
        """Close the node being written and append its bytes to the spool.

        :param pad: When False and the writer reported padding, the last
            entry of the writer's output is dropped and the padding is only
            accounted for in the page-boundary check.
        :raises AssertionError: if the spool position, plus any skipped
            padding, is not a multiple of _PAGE_SIZE.
        """
        byte_lines, _, padding = self.writer.finish()
        finished = self.nodes
        if finished == 0:
            # The first node is kept in memory, preceded by zeroed space
            # reserved for the header.
            self.spool = cStringIO.StringIO()
            self.spool.write("\x00" * _RESERVED_HEADER_BYTES)
        elif finished == 1:
            # A second node is being added: move the row to a temp file.
            on_disk = tempfile.TemporaryFile(prefix='bzr-index-row-')
            on_disk.write(self.spool.getvalue())
            self.spool = on_disk
        if pad or not padding:
            skipped_bytes = 0
        else:
            del byte_lines[-1]
            skipped_bytes = padding
        self.spool.writelines(byte_lines)
        end = self.spool.tell()
        remainder = (end + skipped_bytes) % _PAGE_SIZE
        if remainder != 0:
            raise AssertionError("incorrect node length: %d, %d"
                                 % (end, remainder))
        self.nodes += 1
        self.writer = None

class _InternalBuilderRow(_BuilderRow):
    """Row state used while writing the internal (non-leaf) rows."""

    def finish_node(self, pad=True):
        """Finish the current internal node, which is always padded.

        :param pad: Must be true.
        :raises AssertionError: if pad is false.
        """
        if pad:
            _BuilderRow.finish_node(self)
            return
        raise AssertionError("Must pad internal nodes only.")

100

class _LeafBuilderRow(_BuilderRow):
    """Row state used while writing out the leaf row."""

102

103

104

class BTreeBuilder(index.GraphIndexBuilder):

105

"""A Builder for B+Tree based Graph indices.

106

107

The resulting graph has the structure:

108

109

_SIGNATURE OPTIONS NODES

110

_SIGNATURE := 'B+Tree Graph Index 2' NEWLINE

111

OPTIONS := REF_LISTS KEY_ELEMENTS LENGTH ROW_LENGTHS

112

REF_LISTS := 'node_ref_lists=' DIGITS NEWLINE

113

KEY_ELEMENTS := 'key_elements=' DIGITS NEWLINE

114

LENGTH := 'len=' DIGITS NEWLINE

115

ROW_LENGTHS := 'row_lengths=' DIGITS (COMMA DIGITS)* NEWLINE

116

NODES := NODE_COMPRESSED*

117

NODE_COMPRESSED:= COMPRESSED_BYTES{4096}

118

NODE_RAW := INTERNAL | LEAF

119

INTERNAL := INTERNAL_FLAG POINTERS

120

LEAF := LEAF_FLAG ROWS

121

KEY_ELEMENT := Not-whitespace-utf8

122

KEY := KEY_ELEMENT (NULL KEY_ELEMENT)*

123

ROWS := ROW*

124

ROW := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

125

ABSENT := 'a'

126

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

127

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

128

REFERENCE := KEY

129

VALUE := no-newline-no-null-bytes

130

"""

131

132

def __init__(self, reference_lists=0, key_elements=1, spill_at=100000):
    """See GraphIndexBuilder.__init__.

    :param spill_at: Optional threshold; once this many keys are held in
        memory, add_node spills them to disk.
    """
    index.GraphIndexBuilder.__init__(
        self, reference_lists=reference_lists, key_elements=key_elements)
    # Indices already spilled to disk; entries may be None.
    self._backing_indices = []
    self._spill_at = spill_at
    # {key: (node_refs, value)} for the nodes currently held in memory.
    self._nodes = {}
    # None means the by-key map has not been built yet.
    self._nodes_by_key = None
    self._optimize_for_size = False

147

148

def add_node(self, key, value, references=()):
    """Add a node to the index.

    Once the number of keys held in memory reaches the spill_at threshold,
    the in-memory nodes are spilled to disk.

    :param key: The key. keys are non-empty tuples containing
        as many whitespace-free utf8 bytestrings as the key length
        defined for this index.
    :param references: An iterable of iterables of keys. Each is a
        reference to another key.
    :param value: The value to associate with the key. It may be any
        bytes as long as it does not contain NUL or newline bytes.
    :raises errors.BadIndexDuplicateKey: if key is already held in memory.
    """
    # The absent references returned by the check are not needed here.
    node_refs, _ = self._check_key_ref_value(key, references, value)
    if key in self._nodes:
        raise errors.BadIndexDuplicateKey(key, self)
    # TODO: StaticTuple
    self._nodes[key] = (node_refs, value)
    self._keys.add(key)
    if self._nodes_by_key is not None and self._key_length > 1:
        self._update_nodes_by_key(key, value, node_refs)
    if len(self._keys) >= self._spill_at:
        self._spill_mem_keys_to_disk()

174

175

def _spill_mem_keys_to_disk(self):
    """Write the in memory keys down to disk to cap memory consumption.

    When backing indices are being combined, the memory nodes are merged
    with the leading run of existing backing indices into one new index,
    which is stored in the slot after that run while the merged slots are
    reset to None. This gives a powers-of-two pattern: the first spill
    writes a single index, the second merges it into a 2x sized one, the
    third writes a new single index next to the 2x one, the fourth merges
    everything into a 4x sized one, and so on.

    When not combining, the memory nodes are simply written out as one
    more backing index.
    """
    combine = self._combine_backing_indices
    if combine:
        new_backing_file, size, backing_pos = \
            self._spill_mem_keys_and_combine()
    else:
        new_backing_file, size = self._spill_mem_keys_without_combining()
    # Note: The transport here isn't strictly needed, because we will use
    #       direct access to the new_backing._file object
    new_backing = BTreeGraphIndex(get_transport('.'), '<temp>', size)
    # GC will clean up the file
    new_backing._file = new_backing_file
    if combine:
        backing_indices = self._backing_indices
        if len(backing_indices) == backing_pos:
            backing_indices.append(None)
        backing_indices[backing_pos] = new_backing
        # Everything before backing_pos was merged into new_backing.
        backing_indices[:backing_pos] = [None] * backing_pos
    else:
        self._backing_indices.append(new_backing)
    # Start again with empty in-memory state.
    self._keys = set()
    self._nodes = {}
    self._nodes_by_key = None

209

210

def _spill_mem_keys_without_combining(self):

211

return self._write_nodes(self._iter_mem_nodes(), allow_optimize=False)

212

213

def _spill_mem_keys_and_combine(self):

214

iterators_to_combine = [self._iter_mem_nodes()]

215

pos = -1

216

for pos, backing in enumerate(self._backing_indices):

217

if backing is None:

218

pos -= 1

219

break

220

iterators_to_combine.append(backing.iter_all_entries())

221

backing_pos = pos + 1

222

new_backing_file, size = \

223

self._write_nodes(self._iter_smallest(iterators_to_combine),

224

allow_optimize=False)

225

return new_backing_file, size, backing_pos

226

227

def add_nodes(self, nodes):
    """Add nodes to the index.

    :param nodes: An iterable of entries to add. Each entry is
        (key, value, node_refs) when this index has reference lists and
        (key, value) otherwise.
    """
    if not self.reference_lists:
        for key, value in nodes:
            self.add_node(key, value)
        return
    for key, value, node_refs in nodes:
        self.add_node(key, value, node_refs)

238

239

def _iter_mem_nodes(self):

240

"""Iterate over the nodes held in memory."""

241

nodes = self._nodes

242

if self.reference_lists:

243

for key in sorted(nodes):

244

references, value = nodes[key]

245

yield self, key, value, references

246

else:

247

for key in sorted(nodes):

248

references, value = nodes[key]

249

yield self, key, value

250

251

def _iter_smallest(self, iterators_to_combine):

252

if len(iterators_to_combine) == 1:

253

for value in iterators_to_combine[0]:

254

yield value

255

return

256

current_values = []

257

for iterator in iterators_to_combine:

258

try:

259

current_values.append(iterator.next())

260

except StopIteration:

261

current_values.append(None)

262

last = None

263

while True:

264

# Decorate candidates with the value to allow 2.4's min to be used.

265

candidates = [(item[1][1], item) for item

266

in enumerate(current_values) if item[1] is not None]

267

if not len(candidates):

268

return

269

selected = min(candidates)

270

# undecorate back to (pos, node)

271

selected = selected[1]

272

if last == selected[1][1]:

273

raise errors.BadIndexDuplicateKey(last, self)

274

last = selected[1][1]

275

# Yield, with self as the index

276

yield (self,) + selected[1][1:]

277

pos = selected[0]

278

try:

279

current_values[pos] = iterators_to_combine[pos].next()

280

except StopIteration:

281

current_values[pos] = None

282

283

def _add_key(self, string_key, line, rows, allow_optimize=True):
    """Add a key to the current chunk.

    If the leaf node being written is full it is finished, the key is
    recorded as a division point in the rows above (finishing any of those
    that are full too, and inserting a new root row when even the current
    root is full), and the key is then added to a fresh leaf node.

    :param string_key: The key to add.
    :param line: The fully serialised key and value.
    :param rows: The list of builder rows, rows[0] being the root and
        rows[-1] the leaf row. A new root may be inserted at index 0.
    :param allow_optimize: If set to False, prevent setting the optimize
        flag when writing out. This is used by the _spill_mem_keys_to_disk
        functionality.
    :raises errors.BadIndexKey: if line does not fit even into a freshly
        opened leaf node.
    """
    leaf_row = rows[-1]
    new_leaf = False
    if leaf_row.writer is None:
        # opening a new leaf chunk;
        new_leaf = True
        if allow_optimize:
            optimize_for_size = self._optimize_for_size
        else:
            optimize_for_size = False
        for pos, internal_row in enumerate(rows[:-1]):
            # flesh out any internal nodes that are needed to
            # preserve the height of the tree
            if internal_row.writer is not None:
                continue
            length = _PAGE_SIZE
            if internal_row.nodes == 0:
                length -= _RESERVED_HEADER_BYTES # padded
            internal_row.writer = chunk_writer.ChunkWriter(
                length, 0, optimize_for_size=optimize_for_size)
            internal_row.writer.write(_INTERNAL_FLAG)
            internal_row.writer.write(_INTERNAL_OFFSET +
                str(rows[pos + 1].nodes) + "\n")
        # add a new leaf
        length = _PAGE_SIZE
        if leaf_row.nodes == 0:
            length -= _RESERVED_HEADER_BYTES # padded
        # NOTE(review): unlike the internal rows above, the leaf writer
        # does not take allow_optimize into account - confirm intended.
        leaf_row.writer = chunk_writer.ChunkWriter(
            length, optimize_for_size=self._optimize_for_size)
        leaf_row.writer.write(_LEAF_FLAG)
    if not leaf_row.writer.write(line):
        # The key fitted; nothing more to do.
        return
    # this key did not fit in the node:
    if new_leaf:
        # Even an empty node has no room for this line. Finishing the
        # node and retrying would recurse forever, so reject the key.
        raise errors.BadIndexKey(string_key)
    leaf_row.finish_node()
    key_line = string_key + "\n"
    need_new_root = True
    for row in reversed(rows[:-1]):
        # Mark the start of the next node in the node above. If it
        # doesn't fit then propagate upwards until we find one that
        # it does fit into.
        if row.writer.write(key_line):
            row.finish_node()
        else:
            # We've found a node that can handle the pointer.
            need_new_root = False
            break
    # If we reached the current root without being able to mark the
    # division point, then we need a new root:
    if need_new_root:
        if 'index' in debug.debug_flags:
            trace.mutter('Inserting new global row.')
        root_row = _InternalBuilderRow()
        reserved_bytes = 0
        rows.insert(0, root_row)
        # This will be padded, hence the reserved header bytes are
        # taken off the page size.
        root_row.writer = chunk_writer.ChunkWriter(
            _PAGE_SIZE - _RESERVED_HEADER_BYTES,
            reserved_bytes,
            optimize_for_size=self._optimize_for_size)
        root_row.writer.write(_INTERNAL_FLAG)
        root_row.writer.write(_INTERNAL_OFFSET +
            str(rows[1].nodes - 1) + "\n")
        root_row.writer.write(key_line)
    self._add_key(string_key, line, rows, allow_optimize=allow_optimize)

351

352

def _write_nodes(self, node_iterator, allow_optimize=True):
    """Write node_iterator out as a B+Tree.

    :param node_iterator: An iterator of sorted nodes. Each node should
        match the output given by iter_all_entries.
    :param allow_optimize: If set to False, prevent setting the optimize
        flag when writing out. This is used by the _spill_mem_keys_to_disk
        functionality.
    :return: A (file, size) tuple: a file-like object positioned at its
        start that contains the B+Tree for the nodes, and the number of
        bytes written to it.
    :raises AssertionError: if the header does not fit in the reserved
        space, or an internal row copied an unexpected amount of data.
    """
    # The index rows - rows[0] is the root, rows[1] is the layer under it
    # etc.
    rows = []
    # forward sorted by key. In future we may consider topological sorting,
    # at the cost of table scans for direct lookup, or a second index for
    # direct lookup
    key_count = 0
    # A stack with the number of nodes of each size. 0 is the root node
    # and must always be 1 (if there are any nodes in the tree).
    self.row_lengths = []
    # Loop over all nodes adding them to the bottom row
    # (rows[-1]). When we finish a chunk in a row,
    # propagate the key that didn't fit (comes after the chunk) to the
    # row above, transitively.
    for node in node_iterator:
        if not rows:
            # First key triggers the first row
            rows.append(_LeafBuilderRow())
        key_count += 1
        string_key, line = _btree_serializer._flatten_node(
            node, self.reference_lists)
        self._add_key(string_key, line, rows, allow_optimize=allow_optimize)
    # Close the nodes still open, bottom row first; only the leaf row is
    # finished without padding.
    for row in reversed(rows):
        row.finish_node(pad=(type(row) != _LeafBuilderRow))
    row_lengths = [row.nodes for row in rows]
    lines = [
        _BTSIGNATURE,
        _OPTION_NODE_REFS + str(self.reference_lists) + '\n',
        _OPTION_KEY_ELEMENTS + str(self._key_length) + '\n',
        _OPTION_LEN + str(key_count) + '\n',
        _OPTION_ROW_LENGTHS + ','.join(map(str, row_lengths)) + '\n',
        ]
    # More than one leaf node goes to a real file, anything smaller
    # stays in memory.
    if row_lengths and row_lengths[-1] > 1:
        result = tempfile.NamedTemporaryFile(prefix='bzr-index-')
    else:
        result = cStringIO.StringIO()
    result.writelines(lines)
    position = sum(map(len, lines))
    if position > _RESERVED_HEADER_BYTES:
        raise AssertionError("Could not fit the header in the"
                             " reserved space: %d > %d"
                             % (position, _RESERVED_HEADER_BYTES))
    # write the rows out:
    reserved = _RESERVED_HEADER_BYTES # reserved space for first node
    for row in rows:
        spool = row.spool
        spool.flush()
        spool.seek(0)
        # copy nodes to the finalised file.
        # Special case the first node as it may be prefixed
        node = spool.read(_PAGE_SIZE)
        result.write(node[reserved:])
        result.write("\x00" * (reserved - position))
        position = 0 # Only the root row actually has an offset
        copied_len = osutils.pumpfile(spool, result)
        expected_len = (row.nodes - 1) * _PAGE_SIZE
        # The leaf row is allowed to differ from the expected length.
        if copied_len != expected_len and type(row) != _LeafBuilderRow:
            raise AssertionError("Incorrect amount of data copied"
                                 " expected: %d, got: %d"
                                 % (expected_len, copied_len))
    result.flush()
    size = result.tell()
    result.seek(0)
    return result, size

427

428

def finish(self):
    """Finalise the index.

    :return: The file-like object produced by _write_nodes for all the
        entries added to the index.
    """
    result, _size = self._write_nodes(self.iter_all_entries())
    return result

435

436

def iter_all_entries(self):
    """Iterate over all keys within the index.

    The in-memory nodes and every non-None backing index each contribute
    one iterator. A lone iterator is returned directly; several are
    combined through _iter_smallest().

    :return: An iterable of (index, key, value, reference_lists). There is
        no defined order for the result iteration - it will be in the most
        efficient order for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    # Doing serial rather than ordered would be faster; but this shouldn't
    # be getting called routinely anyway.
    sources = [self._iter_mem_nodes()]
    sources.extend([backing.iter_all_entries()
                    for backing in self._backing_indices
                    if backing is not None])
    if len(sources) > 1:
        return self._iter_smallest(sources)
    return sources[0]

455

456

def iter_entries(self, keys):
    """Iterate over keys within the index.

    Keys held in memory are answered first; whatever is left is then
    requested from each non-None backing index in turn.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable of (index, key, value, reference_lists), or of
        (index, key, value) when the index has no reference lists. There
        is no defined order for the result iteration.
    """
    wanted = set(keys)
    in_memory = wanted.intersection(self._keys)
    with_refs = self.reference_lists
    for key in in_memory:
        # Stored nodes are (references, value) pairs.
        stored = self._nodes[key]
        if with_refs:
            yield self, key, stored[1], stored[0]
        else:
            yield self, key, stored[1]
    if not self._backing_indices:
        # Nothing else could hold the remaining keys.
        return
    # Only ask the backing indices for what was not found locally.
    wanted.difference_update(in_memory)
    for backing in self._backing_indices:
        if backing is None:
            continue
        if not wanted:
            return
        for found in backing.iter_entries(wanted):
            wanted.remove(found[1])
            # Report the entry as belonging to this index.
            yield (self,) + found[1:]

488

489

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not to within
    the bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    Matches from the backing indices are yielded before the in-memory
    nodes are consulted.

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned.
    :raises errors.BadIndexKey: when a prefix starts with None or does not
        have the index's key length.
    """
    # XXX: Too much duplication with the GraphIndex class; consider finding
    # a good place to pull out the actual common logic.
    prefixes = set(keys)
    if not prefixes:
        return
    for backing in self._backing_indices:
        if backing is not None:
            for found in backing.iter_entries_prefix(prefixes):
                yield (self,) + found[1:]
    if self._key_length == 1:
        # Single-element keys: a prefix is simply a complete key.
        for prefix in prefixes:
            # sanity check
            if prefix[0] is None or len(prefix) != self._key_length:
                raise errors.BadIndexKey(prefix)
            try:
                stored = self._nodes[prefix]
            except KeyError:
                continue
            if self.reference_lists:
                yield self, prefix, stored[1], stored[0]
            else:
                yield self, prefix, stored[1]
        return
    for prefix in prefixes:
        # sanity check
        if prefix[0] is None or len(prefix) != self._key_length:
            raise errors.BadIndexKey(prefix)
        # Descend the nested dicts along the non-None leading elements.
        subtree = self._get_nodes_by_key()
        remaining = list(prefix)
        try:
            while remaining and remaining[0] is not None:
                subtree = subtree[remaining.pop(0)]
        except KeyError:
            # a non-existent lookup.
            continue
        if not remaining:
            # Every element was given, so we landed on a stored entry.
            yield (self, ) + subtree
            continue
        # Some trailing elements were None: emit everything below here.
        pending = [subtree]
        while pending:
            subtree = pending.pop()
            # can't be empty or would not exist
            sample = subtree.itervalues().next()
            if type(sample) == dict:
                # still an intermediate level, keep descending
                pending.extend(subtree.itervalues())
            else:
                for stored in subtree.itervalues():
                    yield (self, ) + stored

564

565

def _get_nodes_by_key(self):
    """Return self._nodes reorganised as nested dicts, one level per element.

    For a key (foo, bar, baz) the stored entry is reachable as
    result[foo][bar][baz]. The entry is (key, value, references) when the
    index has reference lists and (key, value) otherwise. The mapping is
    built on first use and kept in self._nodes_by_key.
    """
    if self._nodes_by_key is not None:
        return self._nodes_by_key
    with_refs = self.reference_lists
    tree = {}
    for key, (references, value) in self._nodes.iteritems():
        # Walk (creating as needed) the dicts for all but the last element.
        branch = tree
        for element in key[:-1]:
            branch = branch.setdefault(element, {})
        if with_refs:
            branch[key[-1]] = key, value, references
        else:
            branch[key[-1]] = key, value
    self._nodes_by_key = tree
    return tree

582

583

def key_count(self):
    """Return an estimate of the number of keys in this index.

    The result is the number of keys held in memory plus the key_count()
    reported by every non-None backing index.
    """
    total = len(self._keys)
    for backing in self._backing_indices:
        if backing is not None:
            total += backing.key_count()
    return total

590

591

def validate(self):
    """In-memory indices have no known corruption at the moment.

    Nothing is checked; the method always returns None.
    """
    return None

593

594

595

class _LeafNode(object):
    """A leaf node for a serialised B+Tree index."""

    # keys: dict built from the parsed entries
    # min_key / max_key: first element of the first / last parsed entry,
    #   or None when the node holds no entries
    __slots__ = ('keys', 'min_key', 'max_key')

    def __init__(self, bytes, key_length, ref_list_length):
        """Parse bytes to create a leaf node object.

        :param bytes: The serialised content of the node.
        :param key_length: Passed through to the leaf-line parser.
        :param ref_list_length: Passed through to the leaf-line parser.
        """
        # splitlines mangles the \r delimiters.. don't use it.
        parsed = _btree_serializer._parse_leaf_lines(bytes,
            key_length, ref_list_length)
        self.min_key = None
        self.max_key = None
        if parsed:
            # presumably the parser returns entries in key order, making
            # these the smallest and largest keys - TODO confirm
            self.min_key = parsed[0][0]
            self.max_key = parsed[-1][0]
        self.keys = dict(parsed)

611

612

613

class _InternalNode(object):
    """An internal node for a serialised B+Tree index."""

    # keys: list of key tuples parsed from the node body
    # offset: integer read from the node's second line
    __slots__ = ('keys', 'offset')

    def __init__(self, bytes):
        """Parse bytes to create an internal node object."""
        # splitlines mangles the \r delimiters.. don't use it.
        lines = bytes.split('\n')
        self.keys = self._parse_lines(lines)

    def _parse_lines(self, lines):
        """Set self.offset from lines[1] and return the parsed key tuples.

        The first line is ignored, the second supplies the offset (the text
        after its first seven characters), and each following line up to
        the first empty one is split on NUL into an interned key tuple.
        """
        self.offset = int(lines[1][7:])
        parsed = []
        for line in lines[2:]:
            if line == '':
                break
            # TODO: Switch to StaticTuple here.
            parsed.append(tuple([intern(element)
                                 for element in line.split('\0')]))
        return parsed

632

633

634

class BTreeGraphIndex(object):

635

"""Access to nodes via the standard GraphIndex interface for B+Tree's.

636

637

Individual nodes are held in a LRU cache. This holds the root node in

638

memory except when very large walks are done.

639

"""

640

641

def __init__(self, transport, name, size):
    """Create a B+Tree index object on the index name.

    :param transport: The transport to read data for the index from.
    :param name: The file name of the index on transport.
    :param size: Optional size of the index in bytes. This allows
        compatibility with the GraphIndex API, as well as ensuring that
        the initial read (to read the root node header) can be done
        without over-reading even on empty indices, and on small indices
        allows single-IO to read the entire index.
    """
    # Where the index lives.
    self._transport, self._name, self._size = transport, name, size
    self._file = None
    self._recommended_pages = self._compute_recommended_pages()

    # Header-derived state; nothing is known until the root node is read.
    self._root_node = None
    self._key_count = None
    self._row_lengths = None
    self._row_offsets = None # Start of each row, [-1] is the end

    # Caches. The leaf value cache is disabled; the alternative left in
    # the original was lru_cache.LRUCache(100*1000), i.e. a default max
    # size of 100,000 leaf values.
    self._leaf_value_cache = None
    self._leaf_node_cache = lru_cache.LRUCache(_NODE_CACHE_SIZE)
    # We could limit this, but even a 300k record btree has only 3k leaf
    # nodes, and only 20 internal nodes. So the default of 100 nodes in an
    # LRU would mean we always cache everything anyway, no need to pay the
    # overhead of LRU
    self._internal_node_cache = fifo_cache.FIFOCache(100)

669

670

def __eq__(self, other):
    """Equal when self and other were created with the same parameters.

    That is: both are exactly the same type and their transport, name and
    size compare equal.
    """
    same_type = type(self) == type(other)
    return (same_type
            and self._transport == other._transport
            and self._name == other._name
            and self._size == other._size)

677

678

def __ne__(self, other):
    """Return the negation of __eq__(other)."""
    equal = self.__eq__(other)
    return not equal

680

681

def _get_and_cache_nodes(self, nodes):
    """Read nodes and cache them.

    The node positions supplied are sorted and then read via _read_nodes().
    Node 0 becomes self._root_node; every other node is added to the
    internal node cache when it lies before the start of the last row and
    to the leaf node cache otherwise.

    Note: No check is made here that the request fits in the caches, so
    asking for more nodes than a cache can contain may result in some of
    them being discarded from the cache straight away. They are still
    present in the returned dict.

    :param nodes: An iterable of node positions to read.
    :return: A dict of {node_pos: node}
    """
    found = {}
    leaf_start = None
    for position, node in self._read_nodes(sorted(nodes)):
        found[position] = node
        if position == 0: # Special case
            self._root_node = node
            continue
        if leaf_start is None:
            # Looked up lazily, only once a node has actually been read.
            leaf_start = self._row_offsets[-2]
        if position < leaf_start:
            target_cache = self._internal_node_cache
        else:
            target_cache = self._leaf_node_cache
        target_cache.add(position, node)
    return found

708

709

def _compute_recommended_pages(self):
    """Convert transport's recommended_page_size into btree pages.

    recommended_page_size is in bytes, we want to know how many _PAGE_SIZE
    pages fit in that length, rounding any partial page up.

    :return: The number of pages, as an int.
    """
    bytes_per_read = self._transport.recommended_page_size()
    pages = math.ceil(bytes_per_read / float(_PAGE_SIZE))
    return int(pages)

719

720

def _compute_total_pages_in_index(self):
    """How many pages are in the index.

    If we have read the header we will use the value stored there.
    Otherwise it will be computed based on the length of the index.

    :raises AssertionError: when self._size is None.
    """
    if self._size is None:
        raise AssertionError('_compute_total_pages_in_index should not be'
                             ' called when self._size is None')
    if self._root_node is None:
        # No header yet: derive the page count from the size of the index.
        # It should be identical to the count the header would give.
        return int(math.ceil(self._size / float(_PAGE_SIZE)))
    # This is the number of pages as defined by the header
    return self._row_offsets[-1]

736

737

def _expand_offsets(self, offsets):
    """Find extra pages to download.

    The idea is that we always want to make big-enough requests (like 64kB
    for http), so that we don't waste round trips. So given the entries
    that we already have cached and the new pages being downloaded figure
    out what other pages we might want to read.

    See also doc/developers/btree_index_prefetch.txt for more details.

    :param offsets: The offsets to be read
    :return: A list of offsets to download
    """
    def note(fmt, *args):
        # Trace only when the 'index' debug flag is set.
        if 'index' in debug.debug_flags:
            trace.mutter(fmt, *args)

    note('expanding: %s\toffsets: %s', self._name, offsets)

    if len(offsets) >= self._recommended_pages:
        # Don't add more, we are already requesting more than enough
        note(' not expanding large request (%s >= %s)',
             len(offsets), self._recommended_pages)
        return offsets
    if self._size is None:
        # Don't try anything, because we don't know where the file ends
        note(' not expanding without knowing index size')
        return offsets
    total_pages = self._compute_total_pages_in_index()
    cached_offsets = self._get_offsets_to_cached_pages()
    # If reading recommended_pages would read the rest of the index, just
    # do so.
    if total_pages - len(cached_offsets) <= self._recommended_pages:
        # Read whatever is left
        if cached_offsets:
            expanded = [x for x in xrange(total_pages)
                        if x not in cached_offsets]
        else:
            expanded = range(total_pages)
        note(' reading all unread pages: %s', expanded)
        return expanded

    if self._root_node is not None:
        tree_depth = len(self._row_lengths)
        if len(cached_offsets) < tree_depth and len(offsets) == 1:
            # We haven't read enough to justify expansion
            # If we are only going to read the root node, and 1 leaf node,
            # then it isn't worth expanding our request. Once we've read at
            # least 2 nodes, then we are probably doing a search, and we
            # start expanding our requests.
            note(' not expanding on first reads')
            return offsets
        final_offsets = self._expand_to_neighbors(offsets, cached_offsets,
                                                  total_pages)
    else:
        # ATM on the first read of the root node of a large index, we don't
        # bother pre-reading any other pages. This is because the
        # likelihood of actually reading interesting pages is very low.
        # See doc/developers/btree_index_prefetch.txt for a discussion, and
        # a possible implementation when we are guessing that the second
        # layer index is small
        final_offsets = offsets

    final_offsets = sorted(final_offsets)
    note('expanded: %s', final_offsets)
    return final_offsets

805

806

def _expand_to_neighbors(self, offsets, cached_offsets, total_pages):
    """Expand requests to neighbors until we have enough pages.

    This is called from _expand_offsets after policy has determined that we
    want to expand.
    We only want to expand requests within a given layer. We cheat a little
    bit and assume all requests will be in the same layer. This is true
    given the current design, but if it changes this algorithm may perform
    oddly.

    :param offsets: requested offsets
    :param cached_offsets: offsets for pages we currently have cached
    :param total_pages: the number of pages in the index; no offset at or
        beyond it is added
    :return: A set() of offsets after expansion
    """
    final_offsets = set(offsets)
    layer_first = layer_end = None

    def unread(candidate):
        # Neither cached already nor part of the request so far.
        return (candidate not in cached_offsets
                and candidate not in final_offsets)

    frontier = set(final_offsets)
    while frontier and len(final_offsets) < self._recommended_pages:
        discovered = set()
        for pos in frontier:
            if layer_first is None:
                # The layer is determined once, from the first offset seen.
                layer_first, layer_end = self._find_layer_first_and_end(pos)
            before = pos - 1
            if before > 0 and before >= layer_first and unread(before):
                discovered.add(before)
            following = pos + 1
            if (following < total_pages and following < layer_end
                    and unread(following)):
                discovered.add(following)
            # Stopping here once we pass recommended_pages would keep the
            # request from growing too big by only expanding the first
            # offsets. However, if we are making a 'wide' request, it is
            # reasonable to expand all points equally.
        final_offsets.update(discovered)
        frontier = discovered
    return final_offsets

849

850

def external_references(self, ref_list_num):
    """Return the keys referenced by this index but not present in it.

    :param ref_list_num: Which reference list of each entry to inspect.
    :return: A set of referenced keys that are not keys of this index.
    :raises ValueError: when the index has no reference list with that
        number.
    """
    if self._root_node is None:
        self._get_root_node()
    if ref_list_num + 1 > self.node_ref_lists:
        raise ValueError('No ref list %d, index has %d ref lists'
            % (ref_list_num, self.node_ref_lists))
    present = set()
    referenced = set()
    for entry in self.iter_all_entries():
        # entry is (index, key, value, reference_lists)
        present.add(entry[1])
        referenced.update(entry[3][ref_list_num])
    return referenced.difference(present)

862

863

def _find_layer_first_and_end(self, offset):
    """Find the start/stop nodes for the layer corresponding to offset.

    :param offset: The node offset to locate.
    :return: (first, end)
        first is the first node in this layer
        end is the first node of the next layer
    """
    first = end = 0
    for row_boundary in self._row_offsets:
        # Slide the window along: the previous end becomes the new start.
        first, end = end, row_boundary
        if offset < row_boundary:
            break
    return first, end

877

878

def _get_offsets_to_cached_pages(self):
    """Determine what nodes we already have cached.

    :return: A set holding the keys of the internal and leaf node caches,
        plus 0 when the root node has been read.
    """
    cached = set(self._internal_node_cache.keys())
    cached = cached.union(self._leaf_node_cache.keys())
    if self._root_node is not None:
        cached.add(0)
    return cached

885

886

def _get_root_node(self):
    """Return the root node, requesting node 0 first if it is not loaded."""
    root = self._root_node
    if root is None:
        # We may not have a root node yet
        self._get_internal_nodes([0])
        root = self._root_node
    return root

891

892

def _get_nodes(self, cache, node_indexes):
    """Return the requested nodes, reading whatever is not held already.

    Index 0 is answered from self._root_node when that is set; other
    indexes are looked up in cache. Anything still missing is passed
    through _expand_offsets() and read with _get_and_cache_nodes(), so the
    result may contain more nodes than were asked for.

    :param cache: Mapping of node index to node to consult first.
    :param node_indexes: An iterable of node indexes.
    :return: A dict of {node_index: node}
    """
    found = {}
    missing = []
    for index in node_indexes:
        if index == 0 and self._root_node is not None:
            found[0] = self._root_node
        else:
            try:
                found[index] = cache[index]
            except KeyError:
                missing.append(index)
    if missing:
        to_read = self._expand_offsets(missing)
        found.update(self._get_and_cache_nodes(to_read))
    return found

908

909

def _get_internal_nodes(self, node_indexes):
    """Get nodes, from the internal node cache or disk.

    :param node_indexes: The indexes of the nodes to fetch.
    :return: The result of _get_nodes() for the internal node cache.
    """
    cache = self._internal_node_cache
    return self._get_nodes(cache, node_indexes)

915

916

def _cache_leaf_values(self, nodes):
    """Cache directly from key => value, skipping the btree.

    Does nothing when the leaf value cache is disabled (None).

    :param nodes: A dict of leaf nodes whose keys should be cached.
    """
    value_cache = self._leaf_value_cache
    if value_cache is None:
        return
    for node in nodes.itervalues():
        for key, value in node.keys.iteritems():
            if key in value_cache:
                # Don't add the rest of the keys, we've seen this node
                # before.
                break
            value_cache[key] = value

926

927

def _get_leaf_nodes(self, node_indexes):
    """Get a bunch of nodes, from the leaf node cache or disk.

    The nodes obtained are also offered to _cache_leaf_values().

    :param node_indexes: The indexes of the leaf nodes to fetch.
    :return: A dict of {node_index: node}
    """
    leaves = self._get_nodes(self._leaf_node_cache, node_indexes)
    self._cache_leaf_values(leaves)
    return leaves

932

933

def iter_all_entries(self):
    """Iterate over all keys within the index.

    :return: An iterable of (index, key, value) or (index, key, value,
        reference_lists). The former tuple is used when there are no
        reference lists in the index, making the API compatible with simple
        key:value index types. Entries are produced node by node, sorted by
        key within each node.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if not self.key_count():
        return
    if self._row_offsets[-1] == 1:
        # There is only the root node, and we read that via key_count()
        nodes = [(0, self._root_node)]
    else:
        # The leaves are the last row: read every page in it. A separate
        # check for "the leaf row is just page 0" is not needed, that is
        # exactly the root-only case handled above.
        start_of_leaves = self._row_offsets[-2]
        end_of_leaves = self._row_offsets[-1]
        nodes = self._read_nodes(range(start_of_leaves, end_of_leaves))
    # We iterate strictly in-order so that we can use this function
    # for spilling index builds to disk.
    with_refs = self.node_ref_lists
    for _, node in nodes:
        for key, (value, refs) in sorted(node.keys.items()):
            if with_refs:
                yield (self, key, value, refs)
            else:
                yield (self, key, value)

975

976

@staticmethod
def _multi_bisect_right(in_keys, fixed_keys):
    """Find the positions where each 'in_key' would fit in fixed_keys.

    This is equivalent to doing "bisect_right" on each in_key into
    fixed_keys, and grouping the in_keys that share a position.

    :param in_keys: A sorted list of keys to match with fixed_keys
    :param fixed_keys: A sorted list of keys to match against
    :return: A list of (integer position, [key list]) tuples, in increasing
        position order. Positions that receive no key are omitted.
    """
    if not in_keys:
        return []
    if not fixed_keys:
        # no pointers in the fixed_keys list, which means everything must
        # fall to the left.
        return [(0, in_keys)]
    if len(in_keys) == 1: # Bisect will always be faster for M = 1
        return [(bisect_right(fixed_keys, in_keys[0]), in_keys)]

    # TODO: Walking both lists takes M + N steps, bisecting each key takes
    #       M * log2 N steps (in a compiled function). With a cheap way to
    #       compare the two we could pick whichever is smaller, or mix
    #       them: bisect for the first key, walk while keys keep matching,
    #       bisect the remainder for the next one, etc.
    output = []
    fixed_count = len(fixed_keys)
    fixed_pos = 0
    cur_pos = None
    cur_keys = None
    for in_key in in_keys:
        # Both lists are sorted, so the fixed position only moves forward:
        # step past every fixed key that is <= in_key.
        while fixed_pos < fixed_count and in_key >= fixed_keys[fixed_pos]:
            fixed_pos += 1
        if fixed_pos != cur_pos:
            # First key landing at this position: open a new group.
            cur_pos = fixed_pos
            cur_keys = []
            output.append((cur_pos, cur_keys))
        cur_keys.append(in_key)
    return output

1057

1058

def _walk_through_internal_nodes(self, keys):
    """Take the given set of keys, and find the corresponding LeafNodes.

    Starting with all keys at the root (index 0), each internal row in turn
    routes the keys to child nodes using _multi_bisect_right().

    :param keys: An unsorted iterable of keys to search for
    :return: (nodes, keys_at_index)
        nodes is a dict mapping {index: LeafNode}
        keys_at_index is a list of tuples of [(index, [keys for Leaf])]
    """
    # 6 seconds spent in miss_torture using the sorted() line.
    # Even with out of order disk IO it seems faster not to sort it when
    # large queries are being made.
    keys_at_index = [(0, sorted(keys))]

    # One pass per internal row; the last offset is the end of the file
    # and the first is the root itself.
    for next_row_start in self._row_offsets[1:-1]:
        wanted_indexes = [index for index, _ in keys_at_index]
        nodes = self._get_internal_nodes(wanted_indexes)

        children = []
        for node_index, sub_keys in keys_at_index:
            node = nodes[node_index]
            positions = self._multi_bisect_right(sub_keys, node.keys)
            child_base = next_row_start + node.offset
            for position, child_keys in positions:
                children.append((child_base + position, child_keys))
        keys_at_index = children

    # We should now be at the _LeafNodes
    leaf_indexes = [index for index, _ in keys_at_index]

    # TODO: We may *not* want to always read all the nodes in one
    #       big go. Consider setting a max size on this.
    nodes = self._get_leaf_nodes(leaf_indexes)
    return nodes, keys_at_index

1090

1091

def iter_entries(self, keys):
    """Iterate over keys within the index.

    When the leaf value cache is enabled, keys found in it are answered
    straight from the cache and only the remaining keys are looked up in
    the tree.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys supplied. No additional keys will be returned, and every
        key supplied that is in the index will be returned.
    """
    # 6 seconds spent in miss_torture using the sorted() line.
    # Even with out of order disk IO it seems faster not to sort it when
    # large queries are being made.
    # However, now that we are doing multi-way bisecting, we need the keys
    # in sorted order anyway. We could change the multi-way code to not
    # require sorted order. (For example, it bisects for the first node,
    # does an in-order search until a key comes before the current point,
    # which it then bisects for, etc.)
    keys = frozenset(keys)
    if not keys:
        return

    if not self.key_count():
        return

    if self._leaf_value_cache is None:
        needed_keys = keys
    else:
        needed_keys = []
        for key in keys:
            value = self._leaf_value_cache.get(key, None)
            if value is None:
                # Not cached, it has to be looked up in the tree.
                needed_keys.append(key)
                continue
            # Cache hit: answer directly, no need to walk the tree.
            value, refs = value
            if self.node_ref_lists:
                yield (self, key, value, refs)
            else:
                yield (self, key, value)

    # Only the keys not already answered from the cache are searched for;
    # searching for all of them again would yield the cached ones twice.
    if not needed_keys:
        return
    nodes, nodes_and_keys = self._walk_through_internal_nodes(needed_keys)
    for node_index, sub_keys in nodes_and_keys:
        if not sub_keys:
            continue
        node = nodes[node_index]
        for next_sub_key in sub_keys:
            if next_sub_key in node.keys:
                value, refs = node.keys[next_sub_key]
                if self.node_ref_lists:
                    yield (self, next_sub_key, value, refs)
                else:
                    yield (self, next_sub_key, value)

1146

1147

def _find_ancestors(self, keys, ref_list_num, parent_map, missing_keys):
    """Find the parent_map information for the set of keys.

    This populates the parent_map dict and missing_keys set based on the
    queried keys. It also can fill out an arbitrary number of parents that
    it finds while searching for the supplied keys.

    It is unlikely that you want to call this directly. See
    "CombinedGraphIndex.find_ancestry()" for a more appropriate API.

    :param keys: The keys whose ancestry we want to return
        Every key will either end up in 'parent_map' or 'missing_keys'.
    :param ref_list_num: This index in the ref_lists is the parents we
        care about.
    :param parent_map: {key: parent_keys} for keys that are present in this
        index. This may contain more entries than were in 'keys', that are
        reachable ancestors of the keys requested.
    :param missing_keys: keys which are known to be missing in this index.
        This may include parents that were not directly requested, but we
        were able to determine that they are not present in this index.
    :return: search_keys    parents that were found but not queried to know
        if they are missing or present. Callers can re-query this index for
        those keys, and they will be placed into parent_map or missing_keys
    :raises ValueError: when ref_list_num is not a reference list of this
        index.
    """
    if not self.key_count():
        # We use key_count() to trigger reading the root node and
        # determining info about this BTreeGraphIndex
        # If we don't have any keys, then everything is missing
        missing_keys.update(keys)
        return set()
    if ref_list_num >= self.node_ref_lists:
        raise ValueError('No ref list %d, index has %d ref lists'
            % (ref_list_num, self.node_ref_lists))

    # The main trick we are trying to accomplish is that when we find a
    # key listing its parents, we expect that the parent key is also likely
    # to sit on the same page. Allowing us to expand parents quickly
    # without suffering the full stack of bisecting, etc.
    nodes, nodes_and_keys = self._walk_through_internal_nodes(keys)

    # These are parent keys which could not be immediately resolved on the
    # page where the child was present. Note that we may already be
    # searching for that key, and it may actually be present [or known
    # missing] on one of the other pages we are reading.
    # TODO:
    #   We could try searching for them in the immediate previous or next
    #   page. If they occur "later" we could put them in a pending lookup
    #   set, and then for each node we read thereafter we could check to
    #   see if they are present.
    #   However, we don't know the impact of keeping this list of things
    #   that I'm going to search for every node I come across from here on
    #   out.
    #   It doesn't handle the case when the parent key is missing on a
    #   page that we *don't* read. So we already have to handle being
    #   re-entrant for that.
    #   Since most keys contain a date string, they are more likely to be
    #   found earlier in the file than later, but we would know that right
    #   away (key < min_key), and wouldn't keep searching it on every other
    #   page that we read.
    #   Mostly, it is an idea, one which should be benchmarked.
    off_page_parents = set()

    for node_index, sub_keys in nodes_and_keys:
        if not sub_keys:
            continue
        # sub_keys is all of the keys we are looking for that should exist
        # on this page, if they aren't here, then they won't be found
        node = nodes[node_index]
        page_keys = node.keys
        pending = set()
        for wanted in sub_keys:
            if wanted in page_keys:
                value, refs = page_keys[wanted]
                parents = refs[ref_list_num]
                parent_map[wanted] = parents
                pending.update(parents)
            else:
                # This one is just not present in the index at all
                missing_keys.add(wanted)
        # Don't look for things we've already found
        pending = pending.difference(parent_map)
        # Chase parents for as long as they keep turning up on this page.
        while pending:
            next_pending = set()
            for key in pending:
                if key in page_keys:
                    value, refs = page_keys[key]
                    parents = refs[ref_list_num]
                    parent_map[key] = parents
                    next_pending.update(parents)
                elif key < node.min_key or key > node.max_key:
                    # This parent either is genuinely missing, or should be
                    # found on another page: it sorts outside this page's
                    # key range, so it would be on a different LeafNode.
                    # In the case of bzr.dev, 3.4k/5.3k misses are
                    # 'earlier' misses (65%). Checking the range here
                    # rather than deferring everything avoids 'going
                    # around again' for keys that live in another index.
                    off_page_parents.add(key)
                else:
                    # If it was going to be present, it would be on
                    # *this* page, so mark it missing.
                    missing_keys.add(key)
            pending = next_pending.difference(parent_map)
            # Might want to do another .difference() from missing_keys
    # off_page_parents could have been found on a different page, or be
    # known to be missing. So cull out everything that has already been
    # found.
    unresolved = off_page_parents.difference(parent_map)
    return unresolved.difference(missing_keys)

1273

1274

def iter_entries_prefix(self, keys):
    """Iterate over index entries whose keys match the given prefixes.

    Matching is done on whole key elements, never on substrings of an
    element: with the keys ('foo', 'bar') and ('foobar', 'gam') in the
    index, the prefix ('foo', None) selects only ('foo', 'bar').

    WARNING: every call walks self.iter_all_entries() and builds an
    in-memory lookup of the whole index before answering, however few
    prefixes were requested.

    :param keys: An iterable of key prefixes. Each prefix is a tuple with
        as many elements as an index key. Elements from the first None
        onwards are treated as wildcards. The first element must not be
        None. Duplicates are dropped and the prefixes are processed in
        sorted order.
    :return: A generator of tuples shaped like those produced by
        iter_all_entries (this index first, then key, value and, when
        present, references), restricted to the entries matching one of
        the prefixes.
    :raises errors.BadIndexKey: when iteration reaches a prefix whose
        length differs from the index key length (including an empty
        prefix) or whose first element is None.
    """
    keys = sorted(set(keys))
    if not keys:
        return
    # Load if needed to check key lengths
    if self._key_count is None:
        self._get_root_node()
    key_length = self._key_length
    # TODO: only access nodes that can satisfy the prefixes we are looking
    # for. For now, to meet API usage (as this function is not used by
    # current bzrlib) just suck the entire index and iterate in memory.
    nodes = {}
    nodes_by_key = {}
    for entry in self.iter_all_entries():
        # entry is (index, key, value[, refs]); drop the leading index.
        record = tuple(entry[1:])
        key = record[0]
        if key_length == 1:
            # Single-element keys need no nesting: map key -> (value[, refs])
            nodes[key] = record[1:]
            continue
        # For a key of (foo, bar, baz) create
        # nodes_by_key[foo][bar][baz] = record
        key_dict = nodes_by_key
        for subkey in key[:-1]:
            key_dict = key_dict.setdefault(subkey, {})
        key_dict[key[-1]] = record
    for key in keys:
        # sanity check; test the length first so that an empty prefix is
        # reported as a bad key rather than failing on key[0].
        if len(key) != key_length or key[0] is None:
            raise errors.BadIndexKey(key)
        if key_length == 1:
            try:
                found = nodes[key]
            except KeyError:
                continue
            yield (self, key) + found
            continue
        # Descend through the leading concrete (non-None) elements.
        key_dict = nodes_by_key
        matched = 0
        try:
            for element in key:
                if element is None:
                    break
                key_dict = key_dict[element]
                matched += 1
        except KeyError:
            # a non-existent lookup.
            continue
        if matched == key_length:
            # Every element was concrete, so the walk ended on the stored
            # record itself rather than on a sub-dict.
            yield (self, ) + key_dict
            continue
        # A wildcard was hit: emit every record beneath this sub-dict.
        pending = [key_dict]
        while pending:
            for child in pending.pop().values():
                if isinstance(child, dict):
                    pending.append(child)
                else:
                    # each leaf is the (key, value[, refs]) record, ready
                    # to yield.
                    yield (self, ) + child

1385

1386

def key_count(self):
    """Return the number of keys recorded for this index.

    The interface describes the result as an estimate; for
    BTreeGraphIndex the figure is exact because it is stored in the
    header. If no count has been recorded yet, the root node is fetched
    first so that the count becomes available.
    """
    count = self._key_count
    if count is None:
        # Nothing known yet: fetching the root node is expected to fill in
        # self._key_count as a side effect.
        self._get_root_node()
        count = self._key_count
    return count

1395

1396

def _compute_row_offsets(self):
    """Derive self._row_offsets from self._row_lengths.

    The result is the running total of the row lengths, starting at 0 and
    ending with the overall total, so it holds one more entry than
    _row_lengths does.
    """
    running_total = 0
    boundaries = [running_total]
    for length in self._row_lengths:
        running_total += length
        boundaries.append(running_total)
    self._row_offsets = boundaries

1405

1406

def _parse_header_from_bytes(self, bytes):
    """Parse the index header found at the start of a region of bytes.

    The header is the format signature followed by four option lines, in
    this order: node reference list count, key element count, key count
    and the comma-separated row lengths. Parsing stores the values on
    self.node_ref_lists, self._key_length, self._key_count and
    self._row_lengths, then refreshes the row offsets through
    self._compute_row_offsets().

    :param bytes: The data to parse. (The name shadows the builtin but is
        kept because it is part of the method's signature.)
    :return: An offset, data tuple such as readv yields, for the unparsed
        data (which may be of length 0). The offset is the position just
        past the header.
    :raises errors.BadIndexFormatSignature: if the data does not start
        with this index type's signature.
    :raises errors.BadIndexOptions: if an option line is missing, carries
        the wrong prefix or holds a value that is not an integer.
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if signature != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, BTreeGraphIndex)
    lines = bytes[len(expected_signature):].splitlines()
    if len(lines) < 4:
        # A truncated header is a malformed header; report it as such
        # instead of failing with an IndexError further down.
        raise errors.BadIndexOptions(self)

    def option_value(line, prefix):
        # Return the text following `prefix`, insisting it is present.
        if not line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        return line[len(prefix):]

    try:
        self.node_ref_lists = int(option_value(lines[0], _OPTION_NODE_REFS))
        self._key_length = int(option_value(lines[1], _OPTION_KEY_ELEMENTS))
        self._key_count = int(option_value(lines[2], _OPTION_LEN))
        row_lengths = option_value(lines[3], _OPTION_ROW_LENGTHS)
        # Empty fields (e.g. from an empty option value) are skipped.
        self._row_lengths = [int(length)
                             for length in row_lengths.split(',')
                             if length]
    except ValueError:
        raise errors.BadIndexOptions(self)
    self._compute_row_offsets()

    # calculate the bytes we have processed: the signature, the four
    # option lines and one line terminator character for each of them.
    header_end = len(signature) + sum(len(line) for line in lines[:4]) + 4
    return header_end, bytes[header_end:]

1452

1453

def _read_nodes(self, nodes):
    """Read some nodes from disk, parse them and yield them.

    The requested pages are fetched (with a single readv when going
    through the transport, or seek/read calls when self._file is set),
    then each page is decompressed, parsed and yielded. The nodes are
    requested in the supplied order. If possible doing sort() on the list
    before requesting a read may improve performance.

    When node 0 is requested while self._size is not known, the whole
    file is read instead: self._size is set from it, the remaining
    requested nodes are ignored and every page found in the file is
    yielded.

    :param nodes: The nodes to read. 0 - first node, 1 - second node etc.
    :return: A generator of (node_index, node) tuples, where node is a
        _LeafNode or an _InternalNode.
    :raises AssertionError: if a requested page starts past the end of
        the file, or if a decompressed page has an unknown node type.
    """
    # Becomes the byte string of the whole file if we have to read it all.
    whole_file = None
    # list of (offset, length) regions of the file that should, eventually
    # be read in to data_ranges, either from 'whole_file' or from the
    # transport
    ranges = []
    for index in nodes:
        offset = index * _PAGE_SIZE
        size = _PAGE_SIZE
        if index == 0:
            # Root node - special case
            if self._size:
                size = min(_PAGE_SIZE, self._size)
            else:
                # The only case where we don't know the size, is for very
                # small indexes. So we read the whole thing
                whole_file = self._transport.get_bytes(self._name)
                self._size = len(whole_file)
                # the whole thing should be parsed out of 'whole_file'
                ranges.append((0, len(whole_file)))
                break
        else:
            if offset > self._size:
                raise AssertionError('tried to read past the end'
                                     ' of the file %s > %s'
                                     % (offset, self._size))
            size = min(size, self._size - offset)
        ranges.append((offset, size))
    if not ranges:
        return
    elif whole_file is not None:
        # already have the whole file
        data_ranges = [(start, whole_file[start:start+_PAGE_SIZE])
                       for start in xrange(0, len(whole_file), _PAGE_SIZE)]
    elif self._file is None:
        data_ranges = self._transport.readv(self._name, ranges)
    else:
        data_ranges = []
        for offset, size in ranges:
            self._file.seek(offset)
            data_ranges.append((offset, self._file.read(size)))
    for offset, data in data_ranges:
        if offset == 0:
            # extract the header; offset becomes the header length, which
            # still floor-divides to page 0 below.
            offset, data = self._parse_header_from_bytes(data)
            if len(data) == 0:
                continue
        node_bytes = zlib.decompress(data)
        if node_bytes.startswith(_LEAF_FLAG):
            node = _LeafNode(node_bytes, self._key_length,
                             self.node_ref_lists)
        elif node_bytes.startswith(_INTERNAL_FLAG):
            node = _InternalNode(node_bytes)
        else:
            raise AssertionError("Unknown node type for %r" % node_bytes)
        # Explicit floor division keeps the page number an integer.
        yield offset // _PAGE_SIZE, node

1518

1519

def _signature(self):
    """Return the signature that files of this index type start with.

    This is the module-level _BTSIGNATURE constant.
    """
    return _BTSIGNATURE

1522

1523

def validate(self):
    """Check that every node of the index can be read and parsed.

    The root node is fetched first; the remaining nodes are then pulled
    through self._read_nodes() and discarded, so any failure surfaces as
    whatever exception the read or parse raises.
    """
    self._get_root_node()
    # With a single row there should be nothing left to read, so start at
    # node 1; otherwise start where the second row begins.
    first_node = 1
    if len(self._row_lengths) > 1:
        first_node = self._row_offsets[1]
    end_node = self._row_offsets[-1]
    remaining = range(first_node, end_node)
    # Consuming the generator is what performs the read and the parse.
    for _unused in self._read_nodes(remaining):
        pass

1535

1536

1537

try:

1538

from bzrlib import _btree_serializer_pyx as _btree_serializer

1539

except ImportError, e:

1540

osutils.failed_to_load_extension(e)

1541

from bzrlib import _btree_serializer_py as _btree_serializer

Older »