# Copyright (C) 2008 Canonical Ltd
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""B+Tree indices"""

from bisect import bisect_right
from copy import deepcopy
import math
import tempfile
import zlib

from bzrlib import (
    chunk_writer,
    debug,
    errors,
    index,
    lru_cache,
    osutils,
    trace,
    )
from bzrlib.index import _OPTION_NODE_REFS, _OPTION_KEY_ELEMENTS, _OPTION_LEN
from bzrlib.transport import get_transport

_BTSIGNATURE = "B+Tree Graph Index 2\n"
_OPTION_ROW_LENGTHS = "row_lengths="
_LEAF_FLAG = "type=leaf\n"
_INTERNAL_FLAG = "type=internal\n"
_INTERNAL_OFFSET = "offset="

_RESERVED_HEADER_BYTES = 120
_PAGE_SIZE = 4096

# 4K per page: 4MB - 1000 entries
_NODE_CACHE_SIZE = 1000


class _BuilderRow(object):
    """The stored state accumulated while writing out a row in the index.

    :ivar spool: A temporary file used to accumulate nodes for this row
        in the index.
    :ivar nodes: The count of nodes emitted so far.
    """

    def __init__(self):
        """Create a _BuilderRow."""
        self.nodes = 0
        self.spool = tempfile.TemporaryFile()
        self.writer = None

    def finish_node(self, pad=True):
        byte_lines, _, padding = self.writer.finish()
        if self.nodes == 0:
            # reserve space for the header in the first node of the row
            self.spool.write("\x00" * _RESERVED_HEADER_BYTES)
        skipped_bytes = 0
        if not pad and padding:
            del byte_lines[-1]
            skipped_bytes = padding
        self.spool.writelines(byte_lines)
        remainder = (self.spool.tell() + skipped_bytes) % _PAGE_SIZE
        if remainder != 0:
            raise AssertionError("incorrect node length: %d, %d"
                                 % (self.spool.tell(), remainder))
        self.nodes += 1
        self.writer = None


class _InternalBuilderRow(_BuilderRow):
    """The stored state accumulated while writing out internal rows."""

    def finish_node(self, pad=True):
        if not pad:
            raise AssertionError("Must pad internal nodes only.")
        _BuilderRow.finish_node(self)


class _LeafBuilderRow(_BuilderRow):
    """The stored state accumulated while writing out leaf rows."""


class BTreeBuilder(index.GraphIndexBuilder):
    """A Builder for B+Tree based Graph indices.

    The resulting graph has the structure:

    _SIGNATURE OPTIONS NODES
    _SIGNATURE := 'B+Tree Graph Index 2' NEWLINE
    OPTIONS := REF_LISTS KEY_ELEMENTS LENGTH ROW_LENGTHS
    REF_LISTS := 'node_ref_lists=' DIGITS NEWLINE
    KEY_ELEMENTS := 'key_elements=' DIGITS NEWLINE
    LENGTH := 'len=' DIGITS NEWLINE
    ROW_LENGTHS := 'row_lengths=' DIGITS (COMMA DIGITS)* NEWLINE
    NODES := NODE_COMPRESSED*
    NODE_COMPRESSED:= COMPRESSED_BYTES{4096}
    NODE_RAW := INTERNAL | LEAF
    INTERNAL := INTERNAL_FLAG POINTERS
    LEAF := LEAF_FLAG ROWS
    KEY_ELEMENT := Not-whitespace-utf8
    KEY := KEY_ELEMENT (NULL KEY_ELEMENT)*
    ROWS := ROW*
    ROW := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE
    ABSENT := 'a'
    REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}
    REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?
    REFERENCE := KEY
    VALUE := no-newline-no-null-bytes
    """
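
    # A minimal usage sketch (hypothetical keys and values, inferred from the
    # docstrings of add_node() and finish() below rather than taken from the
    # original file):
    #
    #   builder = BTreeBuilder(reference_lists=1, key_elements=1)
    #   builder.add_node(('key-a',), 'value-a', ([('parent-key',)],))
    #   tmp_file = builder.finish()  # temporary file holding the B+Tree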

    def __init__(self, reference_lists=0, key_elements=1, spill_at=100000):
        """See GraphIndexBuilder.__init__.

        :param spill_at: Optional parameter controlling the maximum number
            of nodes that BTreeBuilder will hold in memory.
        """
        index.GraphIndexBuilder.__init__(self, reference_lists=reference_lists,
            key_elements=key_elements)
        self._spill_at = spill_at
        self._backing_indices = []
        # A map of {key: (node_refs, value)}
        self._nodes = {}
        # Indicate it hasn't been built yet
        self._nodes_by_key = None

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        If adding the node causes the builder to reach its spill_at threshold,
        disk spilling will be triggered.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \0 or \n.
        """
        # we don't care about absent_references
        node_refs, _ = self._check_key_ref_value(key, references, value)
        if key in self._nodes:
            raise errors.BadIndexDuplicateKey(key, self)
        self._nodes[key] = (node_refs, value)
        self._keys.add(key)
        if self._nodes_by_key is not None and self._key_length > 1:
            self._update_nodes_by_key(key, value, node_refs)
        if len(self._keys) < self._spill_at:
            return
        self._spill_mem_keys_to_disk()

    def _spill_mem_keys_to_disk(self):
        """Write the in memory keys down to disk to cap memory consumption.

        If we already have some keys written to disk, we will combine them so
        as to preserve the sorted order. The algorithm for combining uses
        powers of two. So on the first spill, write all mem nodes into a
        single index. On the second spill, combine the mem nodes with the nodes
        on disk to create a 2x sized disk index and get rid of the first index.
        On the third spill, create a single new disk index, which will contain
        the mem nodes, and preserve the existing 2x sized index. On the fourth,
        combine mem with the first and second indexes, creating a new one of
        size 4x. On the fifth create a single new one, etc.
        """
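        # Illustrative schedule of the powers-of-two combining described
        # above (sizes in units of one in-memory spill; None marks a slot
        # freed after its contents were merged into a larger index):
        #   after spill 1: [1]
        #   after spill 2: [None, 2]
        #   after spill 3: [1, 2]
        #   after spill 4: [None, None, 4]
        #   after spill 5: [1, None, 4]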
        iterators_to_combine = [self._iter_mem_nodes()]
        pos = -1
        for pos, backing in enumerate(self._backing_indices):
            if backing is None:
                pos -= 1
                break
            iterators_to_combine.append(backing.iter_all_entries())
        backing_pos = pos + 1
        new_backing_file, size = \
            self._write_nodes(self._iter_smallest(iterators_to_combine))
        dir_path, base_name = osutils.split(new_backing_file.name)
        # Note: The transport here isn't strictly needed, because we will use
        #       direct access to the new_backing._file object
        new_backing = BTreeGraphIndex(get_transport(dir_path),
                                      base_name, size)
        # GC will clean up the file
        new_backing._file = new_backing_file
        if len(self._backing_indices) == backing_pos:
            self._backing_indices.append(None)
        self._backing_indices[backing_pos] = new_backing
        for pos in range(backing_pos):
            self._backing_indices[pos] = None
        self._keys = set()
        self._nodes = {}
        self._nodes_by_key = None

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def _iter_mem_nodes(self):
        """Iterate over the nodes held in memory."""
        nodes = self._nodes
        if self.reference_lists:
            for key in sorted(nodes):
                references, value = nodes[key]
                yield self, key, value, references
        else:
            for key in sorted(nodes):
                references, value = nodes[key]
                yield self, key, value

    def _iter_smallest(self, iterators_to_combine):
        if len(iterators_to_combine) == 1:
            for value in iterators_to_combine[0]:
                yield value
            return
        current_values = []
        for iterator in iterators_to_combine:
            try:
                current_values.append(iterator.next())
            except StopIteration:
                current_values.append(None)
        last = None
        while True:
            # Decorate candidates with the value to allow 2.4's min to be used.
            candidates = [(item[1][1], item) for item
                          in enumerate(current_values) if item[1] is not None]
            if not len(candidates):
                return
            selected = min(candidates)
            # undecorate back to (pos, node)
            selected = selected[1]
            if last == selected[1][1]:
                raise errors.BadIndexDuplicateKey(last, self)
            last = selected[1][1]
            # Yield, with self as the index
            yield (self,) + selected[1][1:]
            pos = selected[0]
            try:
                current_values[pos] = iterators_to_combine[pos].next()
            except StopIteration:
                current_values[pos] = None

    def _add_key(self, string_key, line, rows):
        """Add a key to the current chunk.

        :param string_key: The key to add.
        :param line: The fully serialised key and value.
        """
        if rows[-1].writer is None:
            # opening a new leaf chunk;
            for pos, internal_row in enumerate(rows[:-1]):
                # flesh out any internal nodes that are needed to
                # preserve the height of the tree
                if internal_row.writer is None:
                    length = _PAGE_SIZE
                    if internal_row.nodes == 0:
                        length -= _RESERVED_HEADER_BYTES # padded
                    internal_row.writer = chunk_writer.ChunkWriter(length, 0)
                    internal_row.writer.write(_INTERNAL_FLAG)
                    internal_row.writer.write(_INTERNAL_OFFSET +
                        str(rows[pos + 1].nodes) + "\n")
            length = _PAGE_SIZE
            if rows[-1].nodes == 0:
                length -= _RESERVED_HEADER_BYTES # padded
            rows[-1].writer = chunk_writer.ChunkWriter(length)
            rows[-1].writer.write(_LEAF_FLAG)
        if rows[-1].writer.write(line):
            # this key did not fit in the node:
            rows[-1].finish_node()
            key_line = string_key + "\n"
            new_row = True
            for row in reversed(rows[:-1]):
                # Mark the start of the next node in the node above. If it
                # doesn't fit then propagate upwards until we find one that
                # does fit.
                if row.writer.write(key_line):
                    row.finish_node()
                else:
                    # We've found a node that can handle the pointer.
                    new_row = False
                    break
            # If we reached the current root without being able to mark the
            # division point, then we need a new root:
            if new_row:
                if 'index' in debug.debug_flags:
                    trace.mutter('Inserting new global row.')
                new_row = _InternalBuilderRow()
                rows.insert(0, new_row)
                # This will be padded, hence the - _RESERVED_HEADER_BYTES
                new_row.writer = chunk_writer.ChunkWriter(
                    _PAGE_SIZE - _RESERVED_HEADER_BYTES,
                    0)
                new_row.writer.write(_INTERNAL_FLAG)
                new_row.writer.write(_INTERNAL_OFFSET +
                    str(rows[1].nodes - 1) + "\n")
                new_row.writer.write(key_line)
            self._add_key(string_key, line, rows)

    def _write_nodes(self, node_iterator):
        """Write node_iterator out as a B+Tree.

        :param node_iterator: An iterator of sorted nodes. Each node should
            match the output given by iter_all_entries.
        :return: A file handle for a temporary file containing a B+Tree for
            the nodes.
        """
        # The index rows - rows[0] is the root, rows[1] is the layer under it
        # etc.
        rows = []
        # forward sorted by key. In future we may consider topological sorting,
        # at the cost of table scans for direct lookup, or a second index for
        # direct lookup
        key_count = 0
        # A stack with the number of nodes of each size. 0 is the root node
        # and must always be 1 (if there are any nodes in the tree).
        self.row_lengths = []
        # Loop over all nodes adding them to the bottom row
        # (rows[-1]). When we finish a chunk in a row,
        # propagate the key that didn't fit (comes after the chunk) to the
        # row above, transitively.
        for node in node_iterator:
            if key_count == 0:
                # First key triggers the first row
                rows.append(_LeafBuilderRow())
            key_count += 1
            string_key, line = _btree_serializer._flatten_node(node,
                                    self.reference_lists)
            self._add_key(string_key, line, rows)
        for row in reversed(rows):
            pad = (type(row) != _LeafBuilderRow)
            row.finish_node(pad=pad)
        result = tempfile.NamedTemporaryFile()
        lines = [_BTSIGNATURE]
        lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
        lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
        lines.append(_OPTION_LEN + str(key_count) + '\n')
        row_lengths = [row.nodes for row in rows]
        lines.append(_OPTION_ROW_LENGTHS + ','.join(map(str, row_lengths)) + '\n')
        result.writelines(lines)
        position = sum(map(len, lines))
        if position > _RESERVED_HEADER_BYTES:
            raise AssertionError("Could not fit the header in the"
                                 " reserved space: %d > %d"
                                 % (position, _RESERVED_HEADER_BYTES))
        # write the rows out:
        for row in rows:
            reserved = _RESERVED_HEADER_BYTES # reserved space for first node
            row.spool.flush()
            row.spool.seek(0)
            # copy nodes to the finalised file.
            # Special case the first node as it may be prefixed
            node = row.spool.read(_PAGE_SIZE)
            result.write(node[reserved:])
            result.write("\x00" * (reserved - position))
            position = 0 # Only the root row actually has an offset
            copied_len = osutils.pumpfile(row.spool, result)
            if copied_len != (row.nodes - 1) * _PAGE_SIZE:
                if type(row) != _LeafBuilderRow:
                    raise AssertionError("Incorrect amount of data copied"
                        " expected: %d, got: %d"
                        % ((row.nodes - 1) * _PAGE_SIZE,
                           copied_len))
        result.flush()
        size = result.tell()
        result.seek(0)
        return result, size

    def finish(self):
        """Finalise the index.

        :return: A file handle for a temporary file containing the nodes added
            to the index.
        """
        return self._write_nodes(self.iter_all_entries())[0]

    def iter_all_entries(self):
        """Iterate over all keys within the index.

        :return: An iterable of (index, key, value, reference_lists). There is
            no defined order for the result iteration - it will be in the most
            efficient order for the index (in this case dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        # Doing serial rather than ordered would be faster; but this shouldn't
        # be getting called routinely anyway.
        iterators = [self._iter_mem_nodes()]
        for backing in self._backing_indices:
            if backing is not None:
                iterators.append(backing.iter_all_entries())
        if len(iterators) == 1:
            return iterators[0]
        return self._iter_smallest(iterators)

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists). There is
            no defined order for the result iteration - it will be in the most
            efficient order for the index (keys iteration order in this case).
        """
        keys = set(keys)
        if self.reference_lists:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                yield self, key, node[1], node[0]
        else:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                yield self, key, node[1]
        keys.difference_update(self._keys)
        for backing in self._backing_indices:
            if backing is None:
                continue
            if not keys:
                return
            for node in backing.iter_entries(keys):
                keys.remove(node[1])
                yield (self,) + node[1:]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        # XXX: Too much duplication with the GraphIndex class; consider
        # finding a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        for backing in self._backing_indices:
            if backing is None:
                continue
            for node in backing.iter_entries_prefix(keys):
                yield (self,) + node[1:]
        if self._key_length == 1:
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                try:
                    node = self._nodes[key]
                except KeyError:
                    continue
                if self.reference_lists:
                    yield self, key, node[1], node[0]
                else:
                    yield self, key, node[1]
            return
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = self._get_nodes_by_key()
            elements = list(key)
            # find the subdict to return
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    item, value = key_dict.iteritems().next()
                    if type(value) == dict:
                        # push dict down
                        dicts.extend(key_dict.itervalues())
                    else:
                        # yield keys
                        for value in key_dict.itervalues():
                            yield (self, ) + value
            else:
                yield (self, ) + key_dict

    def _get_nodes_by_key(self):
        if self._nodes_by_key is None:
            nodes_by_key = {}
            if self.reference_lists:
                for key, (references, value) in self._nodes.iteritems():
                    key_dict = nodes_by_key
                    for subkey in key[:-1]:
                        key_dict = key_dict.setdefault(subkey, {})
                    key_dict[key[-1]] = key, value, references
            else:
                for key, (references, value) in self._nodes.iteritems():
                    key_dict = nodes_by_key
                    for subkey in key[:-1]:
                        key_dict = key_dict.setdefault(subkey, {})
                    key_dict[key[-1]] = key, value
            self._nodes_by_key = nodes_by_key
        return self._nodes_by_key

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys) + sum(backing.key_count() for backing in
            self._backing_indices if backing is not None)

    def validate(self):
        """In memory indices have no known corruption at the moment."""


class _LeafNode(object):
    """A leaf node for a serialised B+Tree index."""

    def __init__(self, bytes, key_length, ref_list_length):
        """Parse bytes to create a leaf node object."""
        # splitlines mangles the \r delimiters.. don't use it.
        self.keys = dict(_btree_serializer._parse_leaf_lines(bytes,
            key_length, ref_list_length))


class _InternalNode(object):
    """An internal node for a serialised B+Tree index."""

    def __init__(self, bytes):
        """Parse bytes to create an internal node object."""
        # splitlines mangles the \r delimiters.. don't use it.
        self.keys = self._parse_lines(bytes.split('\n'))

    def _parse_lines(self, lines):
        nodes = []
        # lines[1] is the 'offset=' line; 7 == len(_INTERNAL_OFFSET)
        self.offset = int(lines[1][7:])
        for line in lines[2:]:
            if line == '':
                break
            nodes.append(tuple(line.split('\0')))
        return nodes


class BTreeGraphIndex(object):
    """Access to nodes via the standard GraphIndex interface for B+Trees.

    Individual nodes are held in an LRU cache. This holds the root node in
    memory except when very large walks are done.
    """
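
    # A minimal usage sketch (hypothetical file name and size; such a file
    # would normally be produced by BTreeBuilder.finish()):
    #
    #   transport = get_transport('/path/to/dir')
    #   idx = BTreeGraphIndex(transport, 'example.bix', size)
    #   for entry in idx.iter_entries([('key-a',)]):
    #       ...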

    def __init__(self, transport, name, size):
        """Create a B+Tree index object on the index name.

        :param transport: The transport to read data for the index from.
        :param name: The file name of the index on transport.
        :param size: Optional size of the index in bytes. This allows
            compatibility with the GraphIndex API, as well as ensuring that
            the initial read (to read the root node header) can be done
            without over-reading even on empty indices, and on small indices
            allows single-IO to read the entire index.
        """
        self._transport = transport
        self._name = name
        self._size = size
        self._file = None
        self._recommended_pages = self._compute_recommended_pages()
        self._root_node = None
        # Default max size is 100,000 leaf values
        self._leaf_value_cache = None # lru_cache.LRUCache(100*1000)
        self._leaf_node_cache = lru_cache.LRUCache(_NODE_CACHE_SIZE)
        self._internal_node_cache = lru_cache.LRUCache()
        self._key_count = None
        self._row_lengths = None
        self._row_offsets = None # Start of each row, [-1] is the end

    def __eq__(self, other):
        """Equal when self and other were created with the same parameters."""
        return (
            type(self) == type(other) and
            self._transport == other._transport and
            self._name == other._name and
            self._size == other._size)

    def __ne__(self, other):
        return not self.__eq__(other)

    def _get_and_cache_nodes(self, nodes):
        """Read nodes and cache them in the lru.

        The nodes list supplied is sorted and then read from disk, each node
        being inserted into the _node_cache.

        Note: Asking for more nodes than the _node_cache can contain will
        result in some of the results being immediately discarded; to prevent
        this, an assertion is raised if more nodes are asked for than are
        cachable.

        :return: A dict of {node_pos: node}
        """
        found = {}
        start_of_leaves = None
        for node_pos, node in self._read_nodes(sorted(nodes)):
            if node_pos == 0: # Special case
                self._root_node = node
            else:
                if start_of_leaves is None:
                    start_of_leaves = self._row_offsets[-2]
                if node_pos < start_of_leaves:
                    self._internal_node_cache.add(node_pos, node)
                else:
                    self._leaf_node_cache.add(node_pos, node)
            found[node_pos] = node
        return found

    def _compute_recommended_pages(self):
        """Given the transport's recommended_page_size, determine num pages."""
        recommended_read = self._transport.recommended_page_size()
        recommended_pages = int(math.ceil(recommended_read /
                                          float(_PAGE_SIZE)))
        return recommended_pages

    def _compute_num_pages(self):
        """Determine the offset to the last page in this index."""
        if self._size is None:
            raise AssertionError('_compute_num_pages should not be called'
                                 ' when self._size is None')
        if self._root_node is not None:
            # This is the number of pages as defined by the header
            return self._row_offsets[-1]
        # This is the number of pages as defined by the size of the index. They
        # should be identical.
        num_pages = int(math.ceil(self._size / float(_PAGE_SIZE)))
        return num_pages

    def _expand_nodes(self, node_indexes):
        """Find extra nodes to download.

        The idea is that we always want to make big-enough requests (like 64kB
        for http), so that we don't waste round trips. So given the entries
        that we already have cached, and the new nodes being downloaded, figure
        out what other pages we might want to read.

        :param node_indexes: The nodes that have been requested to read.
        :return: A new list of nodes to download.
        """
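        # For example (illustrative numbers only): with _recommended_pages=16,
        # a request for page [5] of a fully unread 10-page index expands to
        # every page, since a single recommended-size read covers the whole
        # file.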
        if 'index' in debug.debug_flags:
            trace.mutter('expanding: %s\tnodes: %s', self._name, node_indexes)

        if len(node_indexes) >= self._recommended_pages:
            # Don't add more, we are already requesting more than enough
            if 'index' in debug.debug_flags:
                trace.mutter(' not expanding large request (%s >= %s)',
                             len(node_indexes), self._recommended_pages)
            return node_indexes
        if self._size is None:
            # Don't try anything, because we don't know where the file ends
            if 'index' in debug.debug_flags:
                trace.mutter(' not expanding without knowing index size')
            return node_indexes
        num_pages = self._compute_num_pages()
        # The idea here is to get nodes "next to" the ones we are already
        # reading.
        cached_keys = self._get_cached_keys()

        # If reading recommended_pages would read the rest of the index, just
        # read the whole thing.
        if num_pages - len(cached_keys) <= self._recommended_pages:
            # Read whatever is left
            if cached_keys:
                expanded = [x for x in xrange(num_pages)
                            if x not in cached_keys]
            else:
                expanded = range(num_pages)
            if 'index' in debug.debug_flags:
                trace.mutter(' reading all unread pages: %s', expanded)
            return expanded

        if self._root_node is None:
            # ATM on the first read of the root node of a large index, we don't
            # bother pre-reading any other pages. This is because the
            # likelihood of actually reading interesting pages is very low.
            # See doc/developers/btree_index_prefetch.txt for a discussion, and
            # a possible implementation when we are guessing that the second
            # layer index is small
            final_nodes = node_indexes
        else:
            tree_depth = len(self._row_lengths)
            if len(cached_keys) < tree_depth and len(node_indexes) == 1:
                # We haven't read enough to justify expansion
                # If we are only going to read the root node, and 1 leaf node,
                # then it isn't worth expanding our request. Once we've read at
                # least 2 nodes, then we are probably doing a search, and we
                # start expanding our requests.
                if 'index' in debug.debug_flags:
                    trace.mutter(' not expanding on first reads')
                return node_indexes

            # Expand requests to neighbors until we have at least
            # recommended_pages to request. We only want to expand requests
            # within a given layer. We cheat a little bit and assume all
            # requests will be in the same layer. This is true given the
            # current design, but if it changes this algorithm may perform
            # poorly.
            final_nodes = set(node_indexes)
            first = end = None
            new_tips = set(final_nodes)
            while len(final_nodes) < self._recommended_pages and new_tips:
                next_tips = set()
                for pos in new_tips:
                    if first is None:
                        first, end = self._find_layer_first_and_end(pos)
                    previous = pos - 1
                    if (previous > 0
                        and previous not in cached_keys
                        and previous not in final_nodes
                        and previous >= first):
                        next_tips.add(previous)
                    after = pos + 1
                    if (after < num_pages
                        and after not in cached_keys
                        and after not in final_nodes
                        and after < end):
                        next_tips.add(after)
                    # This would keep us from going bigger than
                    # recommended_pages by only expanding the first nodes.
                    # However, if we are making a 'wide' request, it is
                    # reasonable to expand all points equally.
                    # if len(final_nodes) > recommended_pages:
                    #     break
                final_nodes.update(next_tips)
                new_tips = next_tips

        final_nodes = sorted(final_nodes)
        if 'index' in debug.debug_flags:
            trace.mutter('expanded: %s', final_nodes)
        return final_nodes

    def _find_layer_first_and_end(self, offset):
        """Find the start/stop nodes for the layer corresponding to offset.

        :return: (first, end)
            first is the first node in this layer
            end is the first node of the next layer
        """
        first = end = 0
        for roffset in self._row_offsets:
            first = end
            end = roffset
            if offset < roffset:
                break
        return first, end

    def _get_cached_keys(self):
        """Determine what nodes we already have cached."""
        cached_keys = set(self._internal_node_cache.keys())
        cached_keys.update(self._leaf_node_cache.keys())
        if self._root_node is not None:
            cached_keys.add(0)
        return cached_keys

    def _get_root_node(self):
        if self._root_node is None:
            # We may not have a root node yet
            self._get_internal_nodes([0])
        return self._root_node

    def _get_nodes(self, cache, node_indexes):
        found = {}
        needed = []
        for idx in node_indexes:
            if idx == 0 and self._root_node is not None:
                found[0] = self._root_node
                continue
            try:
                found[idx] = cache[idx]
            except KeyError:
                needed.append(idx)
        if not needed:
            return found
        needed = self._expand_nodes(needed)
        found.update(self._get_and_cache_nodes(needed))
        return found

    def _get_internal_nodes(self, node_indexes):
        """Get a node, from cache or disk.

        After getting it, the node will be cached.
        """
        return self._get_nodes(self._internal_node_cache, node_indexes)

    def _get_leaf_nodes(self, node_indexes):
        """Get a bunch of nodes, from cache or disk."""
        found = self._get_nodes(self._leaf_node_cache, node_indexes)
        if self._leaf_value_cache is not None:
            for node in found.itervalues():
                for key, value in node.keys.iteritems():
                    if key in self._leaf_value_cache:
                        # Don't add the rest of the keys, we've seen this node
                        break
                    self._leaf_value_cache[key] = value
        return found

    def iter_all_entries(self):
        """Iterate over all keys within the index.

        :return: An iterable of (index, key, value) or
            (index, key, value, reference_lists).
            The former tuple is used when there are no reference lists in the
            index, making the API compatible with simple key:value index types.
            There is no defined order for the result iteration - it will be in
            the most efficient order for the index.
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        if not self.key_count():
            return
        start_of_leaves = self._row_offsets[-2]
        end_of_leaves = self._row_offsets[-1]
        needed_nodes = range(start_of_leaves, end_of_leaves)
        # We iterate strictly in-order so that we can use this function
        # for spilling index builds to disk.
        if self.node_ref_lists:
            for _, node in self._read_nodes(needed_nodes):
                for key, (value, refs) in sorted(node.keys.items()):
                    yield (self, key, value, refs)
        else:
            for _, node in self._read_nodes(needed_nodes):
                for key, (value, refs) in sorted(node.keys.items()):
                    yield (self, key, value)

    @staticmethod
    def _multi_bisect_right(in_keys, fixed_keys):
        """Find the positions where each 'in_key' would fit in fixed_keys.

        This is equivalent to doing "bisect_right" on each in_key into
        fixed_keys.

        :param in_keys: A sorted list of keys to match with fixed_keys
        :param fixed_keys: A sorted list of keys to match against
        :return: A list of (integer position, [key list]) tuples.
        """
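        # Worked example (illustrative): in_keys=[1, 4, 9], fixed_keys=[3, 7]
        # returns [(0, [1]), (1, [4]), (2, [9])]: 1 sorts before 3, 4 falls
        # between 3 and 7, and 9 sorts after 7.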
        if not len(fixed_keys):
            # no pointers in the fixed_keys list, which means everything must
            # fall to the left
            return [(0, in_keys)]

        # TODO: Iterating both lists will generally take M + N steps
        #       Bisecting each key will generally take M * log2 N steps.
        #       If we had an efficient way to compare, we could pick the method
        #       based on which has the fewer number of steps.
        #       There is also the argument that bisect_right is a compiled
        #       function, so there is even more to be gained.
        # iter_steps = len(in_keys) + len(fixed_keys)
        # bisect_steps = len(in_keys) * math.log(len(fixed_keys), 2)
        if len(in_keys) == 1: # Bisect will always be faster for M = 1
            return [(bisect_right(fixed_keys, in_keys[0]), in_keys)]
        # elif bisect_steps < iter_steps:
        #     offsets = {}
        #     for key in in_keys:
        #         offsets.setdefault(bisect_right(fixed_keys, key),
        #                            []).append(key)
        #     return [(o, offsets[o]) for o in sorted(offsets)]
        in_keys_iter = iter(in_keys)
        fixed_keys_iter = enumerate(fixed_keys)
        cur_in_key = in_keys_iter.next()
        cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()

        class InputDone(Exception): pass
        class FixedDone(Exception): pass

        output = []
        cur_out = []

        # TODO: Another possibility is that rather than iterating on each side,
        #       we could use a combination of bisecting and iterating. For
        #       example, while cur_in_key < fixed_key, bisect to find its
        #       point, then iterate all matching keys, then bisect (restricted
        #       to only the remainder) for the next one, etc.
        try:
            while True:
                if cur_in_key < cur_fixed_key:
                    cur_keys = []
                    cur_out = (cur_fixed_offset, cur_keys)
                    output.append(cur_out)
                    while cur_in_key < cur_fixed_key:
                        cur_keys.append(cur_in_key)
                        try:
                            cur_in_key = in_keys_iter.next()
                        except StopIteration:
                            raise InputDone
                    # At this point cur_in_key must be >= cur_fixed_key
                # step the cur_fixed_key until we pass the cur key, or walk off
                # the end
                while cur_in_key >= cur_fixed_key:
                    try:
                        cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()
                    except StopIteration:
                        raise FixedDone
        except InputDone:
            # We consumed all of the input, nothing more to do
            pass
        except FixedDone:
            # There was some input left, but we consumed all of fixed, so we
            # have to add one more for the tail
            cur_keys = [cur_in_key]
            cur_keys.extend(in_keys_iter)
            cur_out = (len(fixed_keys), cur_keys)
            output.append(cur_out)

        return output

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys supplied. No additional keys will be returned, and every
            key supplied that is in the index will be returned.
        """
        # 6 seconds spent in miss_torture using the sorted() line.
        # Even with out of order disk IO it seems faster not to sort it when
        # large queries are being made.
        # However, now that we are doing multi-way bisecting, we need the keys
        # in sorted order anyway. We could change the multi-way code to not
        # require sorted order. (For example, it bisects for the first node,
        # does an in-order search until a key comes before the current point,
        # which it then bisects for, etc.)
        keys = frozenset(keys)
        if not keys:
            return

        if not self.key_count():
            return

        needed_keys = []
        if self._leaf_value_cache is None:
            needed_keys = keys
        else:
            for key in keys:
                value = self._leaf_value_cache.get(key, None)
                if value is not None:
                    value, refs = value
                    # This key is known to be present; serve it from the cache
                    if self.node_ref_lists:
                        yield (self, key, value, refs)
                    else:
                        yield (self, key, value)
                else:
                    needed_keys.append(key)

        # 6 seconds spent in miss_torture using the sorted() line.
        # Even with out of order disk IO it seems faster not to sort it when
        # large queries are being made.
        needed_keys = sorted(needed_keys)

        nodes_and_keys = [(0, needed_keys)]
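        # Illustrative descent (hypothetical 2-layer index): we start with all
        # keys attached to the root, [(0, needed_keys)], then each pass below
        # bisects the keys against a node's pointers and fans them out to the
        # child pages, e.g. [(1, keys_for_page_1), (2, keys_for_page_2)].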
        for row_pos, next_row_start in enumerate(self._row_offsets[1:-1]):
            node_indexes = [idx for idx, s_keys in nodes_and_keys]
            nodes = self._get_internal_nodes(node_indexes)

            next_nodes_and_keys = []
            for node_index, sub_keys in nodes_and_keys:
                node = nodes[node_index]
                positions = self._multi_bisect_right(sub_keys, node.keys)
                node_offset = next_row_start + node.offset
                next_nodes_and_keys.extend([(node_offset + pos, s_keys)
                                            for pos, s_keys in positions])
            nodes_and_keys = next_nodes_and_keys
        # We should now be at the _LeafNodes
        node_indexes = [idx for idx, s_keys in nodes_and_keys]

        # TODO: We may *not* want to always read all the nodes in one
        #       big go. Consider setting a max size on this.

        nodes = self._get_leaf_nodes(node_indexes)
        for node_index, sub_keys in nodes_and_keys:
            if not sub_keys:
                continue
            node = nodes[node_index]
            for next_sub_key in sub_keys:
                if next_sub_key in node.keys:
                    value, refs = node.keys[next_sub_key]
                    if self.node_ref_lists:
                        yield (self, next_sub_key, value, refs)
                    else:
                        yield (self, next_sub_key, value)

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        WARNING: Note that this method currently causes a full index parse
        unconditionally (which is reasonably appropriate as it is a means for
        thunking many small indices into one larger one and still supplies
        iter_all_entries at the thunk layer).

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        keys = sorted(set(keys))
        if not keys:
            return
        # Load if needed to check key lengths
        if self._key_count is None:
            self._get_root_node()
        # TODO: only access nodes that can satisfy the prefixes we are looking
        # for. For now, to meet API usage (as this function is not used by
        # current bzrlib) just suck the entire index and iterate in memory.
        nodes = {}
        if self.node_ref_lists:
            if self._key_length == 1:
                for _1, key, value, refs in self.iter_all_entries():
                    nodes[key] = value, refs
            else:
                nodes_by_key = {}
                for _1, key, value, refs in self.iter_all_entries():
                    key_value = key, value, refs
                    # For a key of (foo, bar, baz) create
                    # _nodes_by_key[foo][bar][baz] = key_value
                    key_dict = nodes_by_key
                    for subkey in key[:-1]:
                        key_dict = key_dict.setdefault(subkey, {})
                    key_dict[key[-1]] = key_value
        else:
            if self._key_length == 1:
                for _1, key, value in self.iter_all_entries():
                    nodes[key] = value
            else:
                nodes_by_key = {}
                for _1, key, value in self.iter_all_entries():
                    key_value = key, value
                    # For a key of (foo, bar, baz) create
                    # _nodes_by_key[foo][bar][baz] = key_value
                    key_dict = nodes_by_key
                    for subkey in key[:-1]:
                        key_dict = key_dict.setdefault(subkey, {})
                    key_dict[key[-1]] = key_value
        if self._key_length == 1:
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                try:
                    if self.node_ref_lists:
                        value, node_refs = nodes[key]
                        yield self, key, value, node_refs
                    else:
                        yield self, key, nodes[key]
                except KeyError:
                    pass
            return
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = nodes_by_key
            elements = list(key)
            # find the subdict whose contents should be returned.
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    item, value = key_dict.iteritems().next()
                    if type(value) == dict:
                        # push dict down
                        dicts.extend(key_dict.itervalues())
                    else:
                        # yield keys
                        for value in key_dict.itervalues():
                            # each value is the key:value:node refs tuple
                            yield (self, ) + value
            else:
                # the last thing looked up was a terminal element
                yield (self, ) + key_dict

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For BTreeGraphIndex the estimate is exact as it is contained in the
        header.
        """
        if self._key_count is None:
            self._get_root_node()
        return self._key_count

    def _compute_row_offsets(self):
        """Fill out the _row_offsets attribute based on _row_lengths."""
        offsets = []
        row_offset = 0
        for row in self._row_lengths:
            offsets.append(row_offset)
            row_offset += row
        offsets.append(row_offset)
        self._row_offsets = offsets

    def _parse_header_from_bytes(self, bytes):
        """Parse the header from a region of bytes.

        :param bytes: The data to parse.
        :return: An offset, data tuple such as readv yields, for the unparsed
            data. (which may be of length 0).
        """
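        # An example header region (hypothetical values) as laid out by
        # BTreeBuilder._write_nodes():
        #   B+Tree Graph Index 2\n
        #   node_ref_lists=1\n
        #   key_elements=1\n
        #   len=100\n
        #   row_lengths=1,25\n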
        signature = bytes[0:len(self._signature())]
        if not signature == self._signature():
            raise errors.BadIndexFormatSignature(self._name, BTreeGraphIndex)
        lines = bytes[len(self._signature()):].splitlines()
        options_line = lines[0]
        if not options_line.startswith(_OPTION_NODE_REFS):
            raise errors.BadIndexOptions(self)
        try:
            self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        options_line = lines[1]
        if not options_line.startswith(_OPTION_KEY_ELEMENTS):
            raise errors.BadIndexOptions(self)
        try:
            self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        options_line = lines[2]
        if not options_line.startswith(_OPTION_LEN):
            raise errors.BadIndexOptions(self)
        try:
            self._key_count = int(options_line[len(_OPTION_LEN):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        options_line = lines[3]
        if not options_line.startswith(_OPTION_ROW_LENGTHS):
            raise errors.BadIndexOptions(self)
        try:
            self._row_lengths = map(int, [length for length in
                options_line[len(_OPTION_ROW_LENGTHS):].split(',')
                if len(length)])
        except ValueError:
            raise errors.BadIndexOptions(self)
        self._compute_row_offsets()

        # calculate the bytes we have processed
        header_end = (len(signature) + sum(map(len, lines[0:4])) + 4)
        return header_end, bytes[header_end:]

    def _read_nodes(self, nodes):
        """Read some nodes from disk into the LRU cache.

        This performs a readv to get the node data into memory, and parses
        each node, then yields it to the caller. The nodes are requested in
        the supplied order. If possible, doing sort() on the list before
        requesting a read may improve performance.

        :param nodes: The nodes to read. 0 - first node, 1 - second node etc.
        """
        ranges = []
        for index in nodes:
            offset = index * _PAGE_SIZE
            size = _PAGE_SIZE
            if index == 0:
                # Root node - special case
                if self._size:
                    size = min(_PAGE_SIZE, self._size)
                else:
                    # We don't know the file size yet; read the first page
                    # and use it to learn the size.
                    stream = self._transport.get(self._name)
                    start = stream.read(_PAGE_SIZE)
                    # Avoid doing this again
                    self._size = len(start)
                    size = min(_PAGE_SIZE, self._size)
            else:
                if offset > self._size:
                    raise AssertionError('tried to read past the end'
                                         ' of the file %s > %s'
                                         % (offset, self._size))
                size = min(size, self._size - offset)
            ranges.append((offset, size))
        if not ranges:
            return
        if self._file is None:
            data_ranges = self._transport.readv(self._name, ranges)
        else:
            data_ranges = []
            for offset, size in ranges:
                self._file.seek(offset)
                data_ranges.append((offset, self._file.read(size)))
        for offset, data in data_ranges:
            if offset == 0:
                # extract the header
                offset, data = self._parse_header_from_bytes(data)
                if len(data) == 0:
                    continue
            bytes = zlib.decompress(data)
            if bytes.startswith(_LEAF_FLAG):
                node = _LeafNode(bytes, self._key_length, self.node_ref_lists)
            elif bytes.startswith(_INTERNAL_FLAG):
                node = _InternalNode(bytes)
            else:
                raise AssertionError("Unknown node type for %r" % bytes)
            yield offset / _PAGE_SIZE, node

    def _signature(self):
        """The file signature for this index type."""
        return _BTSIGNATURE

    def validate(self):
        """Validate that everything in the index can be accessed."""
        # just read and parse every node.
        self._get_root_node()
        if len(self._row_lengths) > 1:
            start_node = self._row_offsets[1]
        else:
            # We shouldn't be reading anything anyway
            start_node = 1
        node_end = self._row_offsets[-1]
        for node in self._read_nodes(range(start_node, node_end)):
            pass


try:
    from bzrlib import _btree_serializer_c as _btree_serializer
except ImportError:
    from bzrlib import _btree_serializer_py as _btree_serializer