/brz/remove-bazaar : revision 3741

To get this branch, use:

bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/knit.py

Committer: Canonical.com Patch Queue Manager
Date: 2008-09-26 05:47:03 UTC
mfrom: (3696.5.4 integration)
Revision ID: pqm@pqm.ubuntu.com-20080926054703-nxn5f1h7z7gvur96

(robertc) Improve the handling of the sha1 cache by updating it
during commit and avoiding some of the sha generation during
iter_changes. (Robert Collins)

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_btree_serializer_c.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chunk_writer.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/index.txt

generate_docs.py

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

INSTALL

Makefile

README

TODO

__init__.py

branch.py

dir.py

dulwich

dulwich/.bzrignore

dulwich/COPYING

dulwich/Makefile

dulwich/README

dulwich/bin

dulwich/bin/dul-daemon

dulwich/bin/dul-receive-pack

dulwich/bin/dul-upload-pack

dulwich/bin/dulwich

dulwich/docs

dulwich/docs/protocol.txt

dulwich/dulwich

dulwich/dulwich/__init__.py

dulwich/dulwich/client.py

dulwich/dulwich/commit.py

dulwich/dulwich/errors.py

dulwich/dulwich/objects.py

dulwich/dulwich/pack.py

dulwich/dulwich/protocol.py

dulwich/dulwich/repo.py

dulwich/dulwich/server.py

dulwich/dulwich/tests

dulwich/dulwich/tests/__init__.py

dulwich/dulwich/tests/data

dulwich/dulwich/tests/data/blobs

dulwich/dulwich/tests/data/blobs/6f670c0fb53f9463760b7295fbb814e965fb20c8

dulwich/dulwich/tests/data/blobs/954a536f7819d40e6f637f849ee187dd10066349

dulwich/dulwich/tests/data/blobs/e69de29bb2d1d6434b8b29ae775ad8c2e48c5391

dulwich/dulwich/tests/data/commits

dulwich/dulwich/tests/data/commits/0d89f20333fbb1d2f3a94da77f4981373d8f4310

dulwich/dulwich/tests/data/commits/5dac377bdded4c9aeb8dff595f0faeebcc8498cc

dulwich/dulwich/tests/data/commits/60dacdc733de308bb77bb76ce0fb0f9b44c9769e

dulwich/dulwich/tests/data/packs

dulwich/dulwich/tests/data/packs/pack-bc63ddad95e7321ee734ea11a7a62d314e0d7481.idx

dulwich/dulwich/tests/data/packs/pack-bc63ddad95e7321ee734ea11a7a62d314e0d7481.pack

dulwich/dulwich/tests/data/repos

dulwich/dulwich/tests/data/repos/a

dulwich/dulwich/tests/data/repos/a/.git

dulwich/dulwich/tests/data/repos/a/.git/HEAD

dulwich/dulwich/tests/data/repos/a/.git/index

dulwich/dulwich/tests/data/repos/a/.git/objects

dulwich/dulwich/tests/data/repos/a/.git/objects/2a

dulwich/dulwich/tests/data/repos/a/.git/objects/2a/72d929692c41d8554c07f6301757ba18a65d91

dulwich/dulwich/tests/data/repos/a/.git/objects/4e

dulwich/dulwich/tests/data/repos/a/.git/objects/4e/f30bbfe26431a69c3820d3a683df54d688f2ec

dulwich/dulwich/tests/data/repos/a/.git/objects/4f

dulwich/dulwich/tests/data/repos/a/.git/objects/4f/2e6529203aa6d44b5af6e3292c837ceda003f9

dulwich/dulwich/tests/data/repos/a/.git/objects/7d

dulwich/dulwich/tests/data/repos/a/.git/objects/7d/9a07d797595ef11344549b8d08198e48c15364

dulwich/dulwich/tests/data/repos/a/.git/objects/a2

dulwich/dulwich/tests/data/repos/a/.git/objects/a2/96d0bb611188cabb256919f36bc30117cca005

dulwich/dulwich/tests/data/repos/a/.git/objects/a9

dulwich/dulwich/tests/data/repos/a/.git/objects/a9/0fa2d900a17e99b433217e988c4eb4a2e9a097

dulwich/dulwich/tests/data/repos/a/.git/objects/ff

dulwich/dulwich/tests/data/repos/a/.git/objects/ff/d47d45845a8f6576491e1edb97e3fe6a850e7f

dulwich/dulwich/tests/data/repos/a/.git/objects/info

dulwich/dulwich/tests/data/repos/a/.git/objects/pack

dulwich/dulwich/tests/data/repos/a/.git/refs

dulwich/dulwich/tests/data/repos/a/.git/refs/heads

dulwich/dulwich/tests/data/repos/a/.git/refs/heads/master

dulwich/dulwich/tests/data/repos/a/.git/refs/tags

dulwich/dulwich/tests/data/repos/a/a

dulwich/dulwich/tests/data/repos/a/b

dulwich/dulwich/tests/data/repos/a/c

dulwich/dulwich/tests/data/repos/ooo_merge

dulwich/dulwich/tests/data/repos/ooo_merge/.git

dulwich/dulwich/tests/data/repos/ooo_merge/.git/HEAD

dulwich/dulwich/tests/data/repos/ooo_merge/.git/index

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/29

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/29/69be3e8ee1c0222396a5611407e4769f14e54b

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/38

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/38/74e9c60a6d149c44c928140f250d81e6381520

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/6f

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/6f/670c0fb53f9463760b7295fbb814e965fb20c8

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/70

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/70/c190eb48fa8bbb50ddc692a17b44cb781af7f6

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/76

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/76/01d7f6231db6a57f7bbb79ee52e4d462fd44d1

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/90

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/90/182552c4a85a45ec2a835cadc3451bebdfe870

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/95

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/95/4a536f7819d40e6f637f849ee187dd10066349

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/b2

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/b2/a2766a2879c209ab1176e7e778b81ae422eeaa

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f5

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f5/07291b64138b875c28e03469025b1ea20bc614

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f9

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/f9/e39b120c68182a4ba35349f832d0e4e61f485c

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/fb

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/fb/5b0425c7ce46959bec94d54b9a157645e114f5

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/info

dulwich/dulwich/tests/data/repos/ooo_merge/.git/objects/pack

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs/heads

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs/heads/master

dulwich/dulwich/tests/data/repos/ooo_merge/.git/refs/tags

dulwich/dulwich/tests/data/repos/ooo_merge/a

dulwich/dulwich/tests/data/repos/ooo_merge/b

dulwich/dulwich/tests/data/repos/ooo_merge/c

dulwich/dulwich/tests/data/repos/simple_merge

dulwich/dulwich/tests/data/repos/simple_merge/.git

dulwich/dulwich/tests/data/repos/simple_merge/.git/HEAD

dulwich/dulwich/tests/data/repos/simple_merge/.git/index

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/0d

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/0d/89f20333fbb1d2f3a94da77f4981373d8f4310

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/1b

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/1b/6318f651a534b38f9c7aedeebbd56c1e896853

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/29

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/29/69be3e8ee1c0222396a5611407e4769f14e54b

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/4c

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/4c/ffe90e0a41ad3f5190079d7c8f036bde29cbe6

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/5d

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/5d/ac377bdded4c9aeb8dff595f0faeebcc8498cc

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/60

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/60/dacdc733de308bb77bb76ce0fb0f9b44c9769e

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/6f

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/6f/670c0fb53f9463760b7295fbb814e965fb20c8

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/70

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/70/c190eb48fa8bbb50ddc692a17b44cb781af7f6

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/90

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/90/182552c4a85a45ec2a835cadc3451bebdfe870

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/95

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/95/4a536f7819d40e6f637f849ee187dd10066349

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/ab

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/ab/64bbdcc51b170d21588e5c5d391ee5c0c96dfd

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d4

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d4/bdad6549dfedf25d3b89d21f506aff575b28a7

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d8

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/d8/0c186a03f423a81b39df39dc87fd269736ca86

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/e6

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/e6/9de29bb2d1d6434b8b29ae775ad8c2e48c5391

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/info

dulwich/dulwich/tests/data/repos/simple_merge/.git/objects/pack

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs/heads

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs/heads/master

dulwich/dulwich/tests/data/repos/simple_merge/.git/refs/tags

dulwich/dulwich/tests/data/repos/simple_merge/a

dulwich/dulwich/tests/data/repos/simple_merge/b

dulwich/dulwich/tests/data/repos/simple_merge/d

dulwich/dulwich/tests/data/repos/simple_merge/e

dulwich/dulwich/tests/data/trees

dulwich/dulwich/tests/data/trees/70c190eb48fa8bbb50ddc692a17b44cb781af7f6

dulwich/dulwich/tests/test_objects.py

dulwich/dulwich/tests/test_pack.py

dulwich/dulwich/tests/test_repository.py

dulwich/setup.py

errors.py

fetch.py

foreign

foreign/.bzrignore

foreign/TODO

foreign/__init__.py

foreign/test_versionedfiles.py

foreign/upgrade.py

foreign/versionedfiles.py

mapping.py

remote.py

repository.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_dir.py

tests/test_ids.py

tests/test_repository.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/knit.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Knit versionedfile implementation.

A knit is a versioned file implementation that supports efficient append only

updates.

Knit file layout:

lifeless: the data file is made up of "delta records". each delta record has a delta header

that contains; (1) a version id, (2) the size of the delta (in lines), and (3) the digest of

the -expanded data- (ie, the delta applied to the parent). the delta also ends with a

end-marker; simply "end VERSION"

delta can be line or full contents.

... the 8's there are the index number of the annotation.

version robertc@robertcollins.net-20051003014215-ee2990904cc4c7ad 7 c7d23b2a5bd6ca00e8e266cec0ec228158ee9f9e

59,59,3

8 if ie.executable:

8 e.set('executable', 'yes')

130,130,2

8 if elt.get('executable') == 'yes':

8 ie.executable = True

end robertc@robertcollins.net-20051003014215-ee2990904cc4c7ad

what's in an index:

09:33 < jrydberg> lifeless: each index is made up of a tuple of; version id, options, position, size, parents

09:33 < jrydberg> lifeless: the parents are currently dictionary compressed

09:33 < jrydberg> lifeless: (meaning it currently does not support ghosts)

09:33 < lifeless> right

09:33 < jrydberg> lifeless: the position and size is the range in the data file

so the index sequence is the dictionary compressed sequence number used

in the deltas to provide line annotation

"""

# TODOS:

# 10:16 < lifeless> make partial index writes safe

# 10:16 < lifeless> implement 'knit.check()' like weave.check()

# 10:17 < lifeless> record known ghosts so we can detect when they are filled in rather than the current 'reweave

# always' approach.

# move sha1 out of the content so that join is faster at verifying parents

# record content length ?

from cStringIO import StringIO

from itertools import izip, chain

import operator

import os

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import (

annotate,

debug,

diff,

graph as _mod_graph,

index as _mod_index,

lru_cache,

pack,

progress,

trace,

tsort,

tuned_gzip,

)

""")

from bzrlib import (

errors,

osutils,

patiencediff,

)

from bzrlib.errors import (

FileExists,

NoSuchFile,

KnitError,

InvalidRevisionId,

KnitCorrupt,

KnitHeaderError,

RevisionNotPresent,

RevisionAlreadyPresent,

)

from bzrlib.osutils import (

100

contains_whitespace,

101

contains_linebreaks,

102

sha_string,

103

sha_strings,

104

split_lines,

105

)

106

from bzrlib.versionedfile import (

107

AbsentContentFactory,

108

adapter_registry,

109

ConstantMapper,

110

ContentFactory,

111

FulltextContentFactory,

112

VersionedFile,

113

VersionedFiles,

114

)

115

116

117

# TODO: Split out code specific to this format into an associated object.

118

119

# TODO: Can we put in some kind of value to check that the index and data

120

# files belong together?

121

122

# TODO: accommodate binaries, perhaps by storing a byte count

123

124

# TODO: function to check whole file

125

126

# TODO: atomically append data, then measure backwards from the cursor

127

# position after writing to work out where it was located. we may need to

128

# bypass python file buffering.

129

130

DATA_SUFFIX = '.knit'

131

INDEX_SUFFIX = '.kndx'

132

133

134

class KnitAdapter(object):
    """Common base for adapters that convert knit records between forms."""

    def __init__(self, basis_vf):
        """Set up the helpers shared by every knit adapter.

        :param basis_vf: A versioned file from which the basis texts of
            deltas are read.  Adapters that never need a basis text may be
            given None.
        """
        self._basis_vf = basis_vf
        # A knit with no index and no data access: the adapters in this
        # module only call its record parsing/serialising helpers.
        self._data = KnitVersionedFiles(None, None)
        self._annotate_factory = KnitAnnotateFactory()
        self._plain_factory = KnitPlainFactory()

147

148

149

class FTAnnotatedToUnannotated(KnitAdapter):
    """Adapter turning an annotated fulltext knit record into a plain one."""

    def get_bytes(self, factory, annotated_compressed_bytes):
        """Re-serialise an annotated fulltext record without annotations.

        :param factory: The content factory the record belongs to (not
            consulted by this adapter).
        :param annotated_compressed_bytes: The raw annotated record bytes.
        :return: The bytes of the re-serialised, unannotated record.
        """
        data = self._data
        header, annotated_lines = data._parse_record_unchecked(
            annotated_compressed_bytes)
        version_id = header[1]
        fulltext = self._annotate_factory.parse_fulltext(annotated_lines,
            version_id)
        # header[3] is passed straight back to _record_to_data (presumably
        # the digest recorded in the header - TODO confirm).
        _size, plain_record = data._record_to_data((version_id,), header[3],
            fulltext.text())
        return plain_record

158

159

160

class DeltaAnnotatedToUnannotated(KnitAdapter):
    """Adapter turning an annotated knit delta record into a plain one."""

    def get_bytes(self, factory, annotated_compressed_bytes):
        """Re-serialise an annotated line-delta record without annotations.

        :param factory: The content factory the record belongs to (not
            consulted by this adapter).
        :param annotated_compressed_bytes: The raw annotated record bytes.
        :return: The bytes of the re-serialised, unannotated delta record.
        """
        data = self._data
        header, annotated_lines = data._parse_record_unchecked(
            annotated_compressed_bytes)
        version_id = header[1]
        # plain=True drops the origin of every delta line while parsing.
        plain_delta = self._annotate_factory.parse_line_delta(
            annotated_lines, version_id, plain=True)
        plain_lines = self._plain_factory.lower_line_delta(plain_delta)
        _size, plain_record = data._record_to_data((version_id,), header[3],
            plain_lines)
        return plain_record

171

172

173

class FTAnnotatedToFullText(KnitAdapter):
    """Adapter turning an annotated fulltext knit record into a full text."""

    def get_bytes(self, factory, annotated_compressed_bytes):
        """Return the full text held in an annotated fulltext record.

        :param factory: The content factory for the record; the last element
            of its key and its _build_details are passed to parse_record.
        :param annotated_compressed_bytes: The raw annotated record bytes.
        :return: The text as one string.
        """
        _header, annotated_lines = self._data._parse_record_unchecked(
            annotated_compressed_bytes)
        # No base content is supplied (None): the record is a fulltext.
        parsed = self._annotate_factory.parse_record(factory.key[-1],
            annotated_lines, factory._build_details, None)
        content, _delta = parsed
        text_lines = content.text()
        return ''.join(text_lines)

182

183

184

class DeltaAnnotatedToFullText(KnitAdapter):
    """Adapter expanding an annotated knit delta record into a full text."""

    def get_bytes(self, factory, annotated_compressed_bytes):
        """Return the full text produced by an annotated line-delta record.

        :param factory: The content factory for the record; parents[0] is
            taken as the compression parent and _build_details[1] as the
            strip-final-eol flag.
        :param annotated_compressed_bytes: The raw annotated record bytes.
        :return: The text as one string.
        :raises errors.RevisionNotPresent: If the compression parent is
            absent from the basis versioned file.
        """
        header, annotated_lines = self._data._parse_record_unchecked(
            annotated_compressed_bytes)
        version_id = header[1]
        plain_delta = self._annotate_factory.parse_line_delta(
            annotated_lines, version_id, plain=True)
        parent_key = factory.parents[0]
        stream = self._basis_vf.get_record_stream(
            [parent_key], 'unordered', True)
        basis_record = stream.next()
        if basis_record.storage_kind == 'absent':
            raise errors.RevisionNotPresent(parent_key, self._basis_vf)
        basis_text = basis_record.get_bytes_as('fulltext')
        # The delta has been stripped of annotations, so it is applied by
        # hand to a plain content object built from the basis text.
        result = PlainKnitContent(split_lines(basis_text), parent_key)
        result.apply_delta(plain_delta, version_id)
        result._should_strip_eol = factory._build_details[1]
        return ''.join(result.text())

204

205

206

class FTPlainToFullText(KnitAdapter):
    """Adapter turning a plain fulltext knit record into a full text."""

    def get_bytes(self, factory, compressed_bytes):
        """Return the full text held in a plain fulltext record.

        :param factory: The content factory for the record; the last element
            of its key and its _build_details are passed to parse_record.
        :param compressed_bytes: The raw plain record bytes.
        :return: The text as one string.
        """
        _header, record_lines = self._data._parse_record_unchecked(
            compressed_bytes)
        # No base content is supplied (None): the record is a fulltext.
        parsed = self._plain_factory.parse_record(factory.key[-1],
            record_lines, factory._build_details, None)
        content, _delta = parsed
        text_lines = content.text()
        return ''.join(text_lines)

215

216

217

class DeltaPlainToFullText(KnitAdapter):
    """An adapter from plain (unannotated) knit deltas to full texts."""

    def get_bytes(self, factory, compressed_bytes):
        """Expand a plain line-delta record into its full text.

        :param factory: The content factory for the record; its parents[0]
            is used as the compression parent and its _build_details are
            handed to parse_record.
        :param compressed_bytes: The raw plain delta record bytes.
        :return: The full text as a single string.
        :raises errors.RevisionNotPresent: If the compression parent is
            absent from the basis versioned file.
        """
        rec, contents = \
            self._data._parse_record_unchecked(compressed_bytes)
        compression_parent = factory.parents[0]
        # XXX: string splitting overhead.
        basis_entry = self._basis_vf.get_record_stream(
            [compression_parent], 'unordered', True).next()
        if basis_entry.storage_kind == 'absent':
            raise errors.RevisionNotPresent(compression_parent, self._basis_vf)
        basis_lines = split_lines(basis_entry.get_bytes_as('fulltext'))
        basis_content = PlainKnitContent(basis_lines, compression_parent)
        # parse_record parses the delta itself, so it is not parsed
        # separately beforehand.  basis_content was built just above and is
        # not shared with anyone, so it is updated in place instead of being
        # copied first.
        content, _ = self._plain_factory.parse_record(rec[1], contents,
            factory._build_details, basis_content, copy_base_content=False)
        return ''.join(content.text())

237

238

239

class KnitContentFactory(ContentFactory):
    """A ContentFactory that hands out records streamed from a knit.

    :seealso ContentFactory:
    """

    def __init__(self, key, parents, build_details, sha1, raw_record,
        annotated, knit=None):
        """Describe one knit record for streaming.

        :param key: The key of the record.
        :param parents: The parents of the record.
        :param build_details: Build details in the form returned by
            get_build_details; only the first element (the method) is
            inspected here.
        :param sha1: The sha1 expected of the full text of this object.
        :param raw_record: The bytes of the knit data from disk.
        :param annotated: True if the raw data is annotated.
        :param knit: Optional knit asked for the text when a 'fulltext'
            representation is requested.
        """
        ContentFactory.__init__(self)
        self.sha1 = sha1
        self.key = key
        self.parents = parents
        # storage_kind is assembled as 'knit-[annotated-](ft|delta)-gz'.
        kind = 'ft'
        if build_details[0] == 'line-delta':
            kind = 'delta'
        annotated_kind = ''
        if annotated:
            annotated_kind = 'annotated-'
        self.storage_kind = 'knit-%s%s-gz' % (annotated_kind, kind)
        self._raw_record = raw_record
        self._build_details = build_details
        self._knit = knit

    def get_bytes_as(self, storage_kind):
        """Return the record in the requested representation.

        :param storage_kind: Either this factory's own storage_kind (the raw
            record is returned) or 'fulltext' (served by the knit given at
            construction, when there is one).
        :raises errors.UnavailableRepresentation: For any other request.
        """
        if storage_kind == self.storage_kind:
            return self._raw_record
        if storage_kind != 'fulltext' or self._knit is None:
            raise errors.UnavailableRepresentation(self.key, storage_kind,
                self.storage_kind)
        return self._knit.get_text(self.key[0])

282

283

284

class KnitContent(object):
    """Content of a knit version to which deltas can be applied.

    The content is kept in memory as a list of newline-terminated lines
    together with a flag recording whether the final newline is really part
    of the text, which mirrors the on-disk knit representation.
    """

    def __init__(self):
        # When True, text() strips the newline from the last line.
        self._should_strip_eol = False

    def apply_delta(self, delta, new_version_id):
        """Apply delta to this object to become new_version_id.

        Must be provided by subclasses.
        """
        raise NotImplementedError(self.apply_delta)

    def line_delta_iter(self, new_lines):
        """Yield the line-based delta from this content to new_lines.

        :param new_lines: The content object to diff against.
        :return: An iterator of (old_start, old_end, new_length, new_data)
            hunks, one for each non-matching region.
        """
        target_texts = new_lines.text()
        source_texts = self.text()
        matcher = patiencediff.PatienceSequenceMatcher(None, source_texts,
            target_texts)
        for tag, old_start, old_end, new_start, new_end in \
                matcher.get_opcodes():
            if tag != 'equal':
                yield (old_start, old_end, new_end - new_start,
                       new_lines._lines[new_start:new_end])

    def line_delta(self, new_lines):
        """Return the hunks of line_delta_iter(new_lines) as a list."""
        return [hunk for hunk in self.line_delta_iter(new_lines)]

    @staticmethod
    def get_line_delta_blocks(knit_delta, source, target):
        """Extract SequenceMatcher.get_matching_blocks() from a knit delta.

        :param knit_delta: An iterable of (start, end, count, lines) hunks.
        :param source: The lines the delta applies to.
        :param target: The lines the delta produces.
        :return: An iterator of (source_pos, target_pos, length) matching
            blocks, finishing with a zero-length block.
        """
        target_total = len(target)
        source_at = 0
        target_at = 0
        for hunk_start, hunk_end, inserted, _new_text in knit_delta:
            gap = hunk_start - source_at
            matched = gap
            if matched > 0:
                # Because of eol handling a knit delta cannot be trusted
                # about the last line of a run matching, so compare it.
                if (source[source_at + matched - 1]
                        != target[target_at + matched - 1]):
                    matched -= 1
                if matched > 0:
                    yield source_at, target_at, matched
            target_at += inserted + gap
            source_at = hunk_end
        remaining = target_total - target_at
        if remaining > 0:
            if (source[source_at + remaining - 1]
                    != target[target_at + remaining - 1]):
                remaining -= 1
            if remaining > 0:
                yield source_at, target_at, remaining
        yield source_at + (target_total - target_at), target_total, 0

338

339

340

class AnnotatedKnitContent(KnitContent):

341

"""Annotated content."""

342

343

def __init__(self, lines):

344

KnitContent.__init__(self)

345

self._lines = lines

346

347

def annotate(self):

348

"""Return a list of (origin, text) for each content line."""

349

lines = self._lines[:]

350

if self._should_strip_eol:

351

origin, last_line = lines[-1]

352

lines[-1] = (origin, last_line.rstrip('\n'))

353

return lines

354

355

def apply_delta(self, delta, new_version_id):

356

"""Apply delta to this object to become new_version_id."""

357

offset = 0

358

lines = self._lines

359

for start, end, count, delta_lines in delta:

360

lines[offset+start:offset+end] = delta_lines

361

offset = offset + (start - end) + count

362

363

def text(self):

364

try:

365

lines = [text for origin, text in self._lines]

366

except ValueError, e:

367

# most commonly (only?) caused by the internal form of the knit

368

# missing annotation information because of a bug - see thread

369

# around 20071015

370

raise KnitCorrupt(self,

371

"line in annotated knit missing annotation information: %s"

372

% (e,))

373

if self._should_strip_eol:

374

lines[-1] = lines[-1].rstrip('\n')

375

return lines

376

377

def copy(self):

378

return AnnotatedKnitContent(self._lines[:])

379

380

381

class PlainKnitContent(KnitContent):
    """Knit content without per-line annotations.

    annotate() attributes every line to the single version id held by the
    object, so annotating a PlainKnitContent is generally not useful.
    """

    def __init__(self, lines, version_id):
        """Wrap lines, a list of text lines belonging to version_id."""
        KnitContent.__init__(self)
        self._lines = lines
        self._version_id = version_id

    def annotate(self):
        """Return a list of (origin, text) pairs, one per content line."""
        origin = self._version_id
        annotated = []
        for line in self._lines:
            annotated.append((origin, line))
        return annotated

    def apply_delta(self, delta, new_version_id):
        """Apply delta to this object to become new_version_id.

        The stored list of lines is modified in place.
        """
        shift = 0
        target = self._lines
        for start, end, count, replacement in delta:
            target[shift + start:shift + end] = replacement
            # Later hunks are addressed in pre-delta line numbers, so track
            # how far the edits so far have moved them.
            shift += (start - end) + count
        self._version_id = new_version_id

    def copy(self):
        """Return a new PlainKnitContent over a copy of the line list."""
        duplicate_lines = self._lines[:]
        return PlainKnitContent(duplicate_lines, self._version_id)

    def text(self):
        """Return the text lines.

        When no eol stripping is needed the internal list itself is
        returned, not a copy.
        """
        if not self._should_strip_eol:
            return self._lines
        stripped = self._lines[:]
        stripped[-1] = stripped[-1].rstrip('\n')
        return stripped

416

417

418

class _KnitFactory(object):
    """Behaviour shared by the annotated and plain knit factories."""

    def parse_record(self, version_id, record, record_details,
                     base_content, copy_base_content=True):
        """Turn a stored record into a full content object.

        :param version_id: The official version id for this content
        :param record: The data returned by read_records_iter()
        :param record_details: Details about the record returned by
            get_build_details, unpacked here as (method, noeol)
        :param base_content: The content the delta applies to when the
            method is 'line-delta'; otherwise unused and may be None
        :param copy_base_content: When building from base_content, True
            applies the delta to a copy, False modifies base_content in
            place.
        :return: (content, delta) A Content object and the parsed
            line-delta, which is None for a fulltext record
        """
        method, noeol = record_details
        if method != 'line-delta':
            content = self.parse_fulltext(record, version_id)
            delta = None
        else:
            content = base_content
            if copy_base_content:
                content = base_content.copy()
            delta = self.parse_line_delta(record, version_id)
            content.apply_delta(delta, version_id)
        content._should_strip_eol = noeol
        return (content, delta)

450

451

452

class KnitAnnotateFactory(_KnitFactory):
    """Factory for creating annotated Content objects."""

    annotated = True

    def make(self, lines, version_id):
        """Return annotated content attributing every line to version_id."""
        num_lines = len(lines)
        return AnnotatedKnitContent(zip([version_id] * num_lines, lines))

    def parse_fulltext(self, content, version_id):
        """Convert fulltext to internal representation

        fulltext content is of the format
        revid(utf8) plaintext\\n
        internal representation is of the format:
        (revid, plaintext)

        :param content: The serialised fulltext lines.
        :param version_id: Unused; origins are read from the lines.
        """
        # TODO: jam 20070209 The tests expect this to be returned as tuples,
        #       but the code itself doesn't really depend on that.
        #       Figure out a way to not require the overhead of turning the
        #       list back into tuples.
        lines = [tuple(line.split(' ', 1)) for line in content]
        return AnnotatedKnitContent(lines)

    def parse_line_delta_iter(self, lines, version_id=None):
        """Return an iterator over the hunks of a serialised line delta.

        :param lines: The serialised delta lines.
        :param version_id: Forwarded to parse_line_delta, which does not
            use it.  Optional, so the previous one-argument call form is
            still accepted.
        """
        # parse_line_delta requires version_id; calling it with lines alone
        # raised TypeError.
        return iter(self.parse_line_delta(lines, version_id))

    def parse_line_delta(self, lines, version_id, plain=False):
        """Convert a line based delta into internal representation.

        line delta is in the form of:
        intstart intend intcount
        1..count lines:
        revid(utf8) newline\\n
        internal representation is
        (start, end, count, [1..count tuples (revid, newline)])

        :param lines: The serialised delta lines.
        :param version_id: Unused; origins are read from the lines.
        :param plain: If True, the lines are returned as a plain
            list without annotations, not as a list of (origin, content)
            tuples, i.e.
            (start, end, count, [1..count newline])
        """
        result = []
        lines = iter(lines)
        # The header loop and the body reads share one iterator, so each
        # header is followed by consuming exactly `count` body lines.
        next_line = lines.next

        # walk through the lines parsing.
        # Note that the plain test is explicitly pulled out of the
        # loop to minimise any performance impact
        if plain:
            for header in lines:
                start, end, count = [int(n) for n in header.split(',')]
                contents = [next_line().split(' ', 1)[1]
                            for i in xrange(count)]
                result.append((start, end, count, contents))
        else:
            for header in lines:
                start, end, count = [int(n) for n in header.split(',')]
                contents = [tuple(next_line().split(' ', 1))
                            for i in xrange(count)]
                result.append((start, end, count, contents))
        return result

    def get_fulltext_content(self, lines):
        """Extract just the content lines from a fulltext."""
        return (line.split(' ', 1)[1] for line in lines)

    def get_linedelta_content(self, lines):
        """Extract just the content from a line delta.

        This doesn't return all of the extra information stored in a delta.
        Only the actual content lines.
        """
        lines = iter(lines)
        next_line = lines.next
        for header in lines:
            header = header.split(',')
            count = int(header[2])
            for i in xrange(count):
                origin, text = next_line().split(' ', 1)
                yield text

    def lower_fulltext(self, content):
        """convert a fulltext content record into a serializable form.

        see parse_fulltext which this inverts.
        """
        # TODO: jam 20070209 We only do the caching thing to make sure that
        #       the origin is a valid utf-8 line, eventually we could remove it
        return ['%s %s' % (o, t) for o, t in content._lines]

    def lower_line_delta(self, delta):
        """convert a delta into a serializable form.

        See parse_line_delta which this inverts.
        """
        # TODO: jam 20070209 We only do the caching thing to make sure that
        #       the origin is a valid utf-8 line, eventually we could remove it
        out = []
        for start, end, c, lines in delta:
            out.append('%d,%d,%d\n' % (start, end, c))
            out.extend(origin + ' ' + text
                       for origin, text in lines)
        return out

    def annotate(self, knit, key):
        """Return (origin_key, line) pairs for the text stored at key.

        :param knit: The knit to read the content from.
        :param key: The key of the text to annotate.
        """
        content = knit._get_content(key)
        # adjust for the fact that serialised annotations are only key suffixes
        # for this factory.
        if type(key) == tuple:
            prefix = key[:-1]
            return [(prefix + (origin,), line)
                    for origin, line in content.annotate()]
        else:
            # XXX: This smells a bit.  Why would key ever be a non-tuple here?
            # Aren't keys defined to be tuples?  -- spiv 20080618
            return content.annotate()

574

575

576

class KnitPlainFactory(_KnitFactory):
    """Factory producing plain (unannotated) Content objects."""

    annotated = False

    def make(self, lines, version_id):
        """Return plain content holding lines for version_id."""
        return PlainKnitContent(lines, version_id)

    def parse_fulltext(self, content, version_id):
        """Parse an unannotated fulltext.

        The lines need no conversion; they are wrapped in a content object
        that remembers version_id.
        """
        return self.make(content, version_id)

    def parse_line_delta_iter(self, lines, version_id):
        """Yield (start, end, count, new_lines) for each hunk in lines.

        :param lines: The serialised delta as an indexable sequence of
            lines: a 'start,end,count' header followed by count body lines,
            repeated.
        :param version_id: Unused.
        """
        position = 0
        total = len(lines)
        while position < total:
            start, end, count = [int(field)
                                 for field in lines[position].split(',')]
            body_start = position + 1
            body_end = body_start + count
            yield start, end, count, lines[body_start:body_end]
            position = body_end

    def parse_line_delta(self, lines, version_id):
        """Return the hunks of parse_line_delta_iter as a list."""
        hunks = self.parse_line_delta_iter(lines, version_id)
        return list(hunks)

    def get_fulltext_content(self, lines):
        """Extract just the content lines from a fulltext."""
        return iter(lines)

    def get_linedelta_content(self, lines):
        """Extract just the content from a line delta.

        Only the body lines are produced; the hunk headers are consumed and
        dropped.
        """
        line_iter = iter(lines)
        take = line_iter.next
        for header in line_iter:
            count = int(header.split(',')[2])
            for _ in xrange(count):
                yield take()

    def lower_fulltext(self, content):
        """Return the text lines of content as the serialised form."""
        return content.text()

    def lower_line_delta(self, delta):
        """Serialise delta: a 'start,end,count' header, then the lines."""
        serialised = []
        for start, end, count, hunk_lines in delta:
            serialised.append('%d,%d,%d\n' % (start, end, count))
            serialised.extend(hunk_lines)
        return serialised

    def annotate(self, knit, key):
        """Annotate key by delegating to a _KnitAnnotator for knit."""
        return _KnitAnnotator(knit).annotate(key)

636

637

638

639

def make_file_factory(annotated, mapper):
    """Return a factory building file based KnitVersionedFiles.

    This is only functional enough to run interface tests, it doesn't try to
    provide a full pack environment.

    :param annotated: knit annotations are wanted.
    :param mapper: The mapper from keys to paths.
    :return: A callable taking a transport and returning a
        KnitVersionedFiles.
    """
    def factory(transport):
        def none_callback():
            return None

        def true_callback():
            return True

        kndx = _KndxIndex(transport, mapper, none_callback, true_callback,
            true_callback)
        key_access = _KnitKeyAccess(transport, mapper)
        return KnitVersionedFiles(kndx, key_access, annotated=annotated)
    return factory

653

654

655

def make_pack_factory(graph, delta, keylength):
    """Return a factory building pack based VersionedFiles.

    This is only functional enough to run interface tests, it doesn't try to
    provide a full pack environment.

    :param graph: Store a graph.
    :param delta: Delta compress contents.
    :param keylength: How long should keys be.
    :return: A callable taking a transport and returning a
        KnitVersionedFiles that also carries the open `stream` and `writer`
        as attributes.
    """
    def factory(transport):
        parents = graph or delta
        # One reference list when a graph is stored, one more for deltas.
        ref_length = 0
        max_delta_chain = 0
        if graph:
            ref_length = 1
        if delta:
            ref_length += 1
            max_delta_chain = 200
        graph_index = _mod_index.InMemoryGraphIndex(
            reference_lists=ref_length, key_elements=keylength)
        stream = transport.open_write_stream('newpack')
        writer = pack.ContainerWriter(stream.write)
        writer.begin()
        knit_index = _KnitGraphIndex(graph_index, lambda:True,
            parents=parents, deltas=delta,
            add_callback=graph_index.add_nodes)
        pack_access = _DirectPackAccess({})
        pack_access.set_writer(writer, graph_index, (transport, 'newpack'))
        versioned_files = KnitVersionedFiles(knit_index, pack_access,
            max_delta_chain=max_delta_chain)
        # Kept on the result so they can be shut down later.
        versioned_files.stream = stream
        versioned_files.writer = writer
        return versioned_files
    return factory

690

691

692

def cleanup_pack_knit(versioned_files):
    """Close the stream and end the writer attached to versioned_files.

    :param versioned_files: An object exposing ``stream`` and ``writer``
        attributes, such as the result of a make_pack_factory() factory.
    """
    pack_stream = versioned_files.stream
    pack_stream.close()
    container = versioned_files.writer
    container.end()

695

696

697

class KnitVersionedFiles(VersionedFiles):

698

"""Storage for many versioned files using knit compression.

699

700

Backend storage is managed by indices and data objects.

701

702

:ivar _index: A _KnitGraphIndex or similar that can describe the

703

parents, graph, compression and data location of entries in this

704

KnitVersionedFiles. Note that this is only the index for

705

*this* vfs; if there are fallbacks they must be queried separately.

706

"""

707

708

def __init__(self, index, data_access, max_delta_chain=200,
             annotated=False):
    """Create a KnitVersionedFiles with index and data_access.

    :param index: The index for the knit data.
    :param data_access: The access object to store and retrieve knit
        records.
    :param max_delta_chain: The maximum number of deltas to permit during
        insertion. Set to 0 to prohibit the use of deltas.
    :param annotated: Set to True to cause annotations to be calculated and
        stored during insertion.
    """
    # No fallback sources until add_fallback_versioned_files() is called.
    self._fallback_vfs = []
    self._max_delta_chain = max_delta_chain
    self._access = data_access
    self._index = index
    # The content factory decides whether annotations are stored.
    if not annotated:
        self._factory = KnitPlainFactory()
    else:
        self._factory = KnitAnnotateFactory()

728

729

def __repr__(self):

730

return "%s(%r, %r)" % (

731

self.__class__.__name__,

732

self._index,

733

self._access)

734

735

def add_fallback_versioned_files(self, a_versioned_files):

736

"""Add a source of texts for texts not present in this knit.

737

738

:param a_versioned_files: A VersionedFiles object.

739

"""

740

self._fallback_vfs.append(a_versioned_files)

741

742

def add_lines(self, key, parents, lines, parent_texts=None,
              left_matching_blocks=None, nostore_sha=None, random_id=False,
              check_content=True):
    """See VersionedFiles.add_lines().

    The index is asked whether writing is permitted and the key and lines
    are validated with _check_add() before the text is handed to _add().

    :return: The result of _add().
    """
    self._index._check_write_ok()
    self._check_add(key, lines, random_id, check_content)
    graph_parents = parents
    if graph_parents is None:
        # Callers may pass None when there is no graph data; kndx indexes
        # can't directly store that, so they get an empty tuple instead.
        graph_parents = ()
    return self._add(key, lines, graph_parents, parent_texts,
        left_matching_blocks, nostore_sha, random_id)

755

756

def _add(self, key, lines, parents, parent_texts,
         left_matching_blocks, nostore_sha, random_id):
    """Add a set of lines on top of version specified by parents.

    Any versions not present will be converted into ghosts.

    :return: A tuple (digest, text_length, content): the sha of the joined
        input lines, the length of the joined input lines and the content
        object built by the factory.
    :raises errors.ExistingContent: When nostore_sha equals the digest of
        the supplied lines.
    :raises TypeError: When an element of key is not a str.
    """
    # First find out whether this is content the caller doesn't want stored.
    line_bytes = ''.join(lines)
    digest = sha_string(line_bytes)
    if nostore_sha == digest:
        raise errors.ExistingContent

    if parent_texts is None:
        parent_texts = {}
    # A single query ascertains which parents are present.
    present_parent_map = self.get_parent_map(parents)
    present_parents = [parent for parent in parents
        if parent in present_parent_map]

    # Currently we can only compress against the left most present parent.
    if present_parents and present_parents[0] == parents[0]:
        # The delta chain is limited to a fixed number of deltas to speed
        # up extraction; this should minimize both I/O and the time spent
        # applying deltas.
        delta = self._check_should_delta(present_parents[0])
    else:
        delta = False

    text_length = len(line_bytes)
    options = []
    if lines and lines[-1][-1] != '\n':
        # Work on a copy of lines before appending the missing newline.
        lines = lines[:]
        options.append('no-eol')
        lines[-1] = lines[-1] + '\n'
        line_bytes += '\n'

    for element in key:
        if type(element) != str:
            raise TypeError("key contains non-strings: %r" % (key,))
    # Knit hunks are still last-element only
    version_id = key[-1]
    content = self._factory.make(lines, version_id)
    if 'no-eol' in options:
        # Hint to the content object that its text() call should strip the
        # EOL.
        content._should_strip_eol = True
    if delta or (self._factory.annotated and len(present_parents) > 0):
        # Merge annotations from parent texts if needed.
        delta_hunks = self._merge_annotations(content, present_parents,
            parent_texts, delta, self._factory.annotated,
            left_matching_blocks)

    if delta:
        options.append('line-delta')
        store_lines = self._factory.lower_line_delta(delta_hunks)
        size, raw_bytes = self._record_to_data(key, digest, store_lines)
    else:
        options.append('fulltext')
        # isinstance is slower and we have no hierarchy.
        if self._factory.__class__ == KnitPlainFactory:
            # Reuse the already joined bytes, saving iteration time in
            # _record_to_data.
            size, raw_bytes = self._record_to_data(key, digest, lines,
                [line_bytes])
        else:
            # Mixed annotation + content is fed into the serialiser.
            store_lines = self._factory.lower_fulltext(content)
            size, raw_bytes = self._record_to_data(key, digest, store_lines)

    access_memo = self._access.add_raw_records([(key, size)], raw_bytes)[0]
    self._index.add_records(
        ((key, options, access_memo, parents),),
        random_id=random_id)
    return digest, text_length, content

839

840

def annotate(self, key):

841

"""See VersionedFiles.annotate."""

842

return self._factory.annotate(self, key)

843

844

def check(self, progress_bar=None):

845

"""See VersionedFiles.check()."""

846

# This doesn't actually test extraction of everything, but that will

847

# impact 'bzr check' substantially, and needs to be integrated with

848

# care. However, it does check for the obvious problem of a delta with

849

# no basis.

850

keys = self._index.keys()

851

parent_map = self.get_parent_map(keys)

852

for key in keys:

853

if self._index.get_method(key) != 'fulltext':

854

compression_parent = parent_map[key][0]

855

if compression_parent not in parent_map:

856

raise errors.KnitCorrupt(self,

857

"Missing basis parent %s for %s" % (

858

compression_parent, key))

859

for fallback_vfs in self._fallback_vfs:

860

fallback_vfs.check()

861

862

def _check_add(self, key, lines, random_id, check_content):
    """Check that the last element of key and the lines are safe to add.

    :param key: The key being added; only its last element is inspected.
    :param lines: The lines being added.
    :param random_id: Accepted but not consulted here.
    :param check_content: When false the two line checks are skipped.
    :raises InvalidRevisionId: When the version id contains whitespace.
    """
    version_id = key[-1]
    if contains_whitespace(version_id):
        raise InvalidRevisionId(version_id, self)
    self.check_not_reserved_id(version_id)
    # TODO: If random_id==False and the key is already present, we should
    # probably check that the existing content is identical to what is
    # being inserted, and otherwise raise an exception.  This would make
    # the bundle code simpler.
    if not check_content:
        return
    self._check_lines_not_unicode(lines)
    self._check_lines_are_lines(lines)

875

876

def _check_header(self, key, line):
    """Split a record header line and verify it names the expected version.

    :param key: The key the record was read for; its last element must
        match the version recorded in the header.
    :param line: The raw header line.
    :return: The split header as returned by _split_header().
    """
    header_fields = self._split_header(line)
    expected_version = key[-1]
    self._check_header_version(header_fields, expected_version)
    return header_fields

880

881

def _check_header_version(self, rec, version_id):

882

"""Checks the header version on original format knit records.

883

884

These have the last component of the key embedded in the record.

885

"""

886

if rec[1] != version_id:

887

raise KnitCorrupt(self,

888

'unexpected version, wanted %r, got %r' % (version_id, rec[1]))

889

890

def _check_should_delta(self, parent):

891

"""Iterate back through the parent listing, looking for a fulltext.

892

893

This is used when we want to decide whether to add a delta or a new

894

fulltext. It searches for _max_delta_chain parents. When it finds a

895

fulltext parent, it sees if the total size of the deltas leading up to

896

it is large enough to indicate that we want a new full text anyway.

897

898

Return True if we should create a new delta, False if we should use a

899

full text.

900

"""

901

delta_size = 0

902

fulltext_size = None

903

for count in xrange(self._max_delta_chain):

904

# XXX: Collapse these two queries:

905

try:

906

# Note that this only looks in the index of this particular

907

# KnitVersionedFiles, not in the fallbacks. This ensures that

908

# we won't store a delta spanning physical repository

909

# boundaries.

910

method = self._index.get_method(parent)

911

except RevisionNotPresent:

912

# Some basis is not locally present: always delta

913

return False

914

index, pos, size = self._index.get_position(parent)

915

if method == 'fulltext':

916

fulltext_size = size

917

break

918

delta_size += size

919

# We don't explicitly check for presence because this is in an

920

# inner loop, and if it's missing it'll fail anyhow.

921

# TODO: This should be asking for compression parent, not graph

922

# parent.

923

parent = self._index.get_parent_map([parent])[parent][0]

924

else:

925

# We couldn't find a fulltext, so we must create a new one

926

return False

927

# Simple heuristic - if the total I/O wold be greater as a delta than

928

# the originally installed fulltext, we create a new fulltext.

929

return fulltext_size > delta_size

930

931

def _build_details_to_components(self, build_details):

932

"""Convert a build_details tuple to a position tuple."""

933

# record_details, access_memo, compression_parent

934

return build_details[3], build_details[0], build_details[1]

935

936

def _get_components_positions(self, keys, allow_missing=False):

937

"""Produce a map of position data for the components of keys.

938

939

This data is intended to be used for retrieving the knit records.

940

941

A dict of key to (record_details, index_memo, next, parents) is

942

returned.

943

method is the way referenced data should be applied.

944

index_memo is the handle to pass to the data access to actually get the

945

data

946

next is the build-parent of the version, or None for fulltexts.

947

parents is the version_ids of the parents of this version

948

949

:param allow_missing: If True do not raise an error on a missing component,

950

just ignore it.

951

"""

952

component_data = {}

953

pending_components = keys

954

while pending_components:

955

build_details = self._index.get_build_details(pending_components)

956

current_components = set(pending_components)

957

pending_components = set()

958

for key, details in build_details.iteritems():

959

(index_memo, compression_parent, parents,

960

record_details) = details

961

method = record_details[0]

962

if compression_parent is not None:

963

pending_components.add(compression_parent)

964

component_data[key] = self._build_details_to_components(details)

965

missing = current_components.difference(build_details)

966

if missing and not allow_missing:

967

raise errors.RevisionNotPresent(missing.pop(), self)

968

return component_data

969

970

def _get_content(self, key, parent_texts={}):

971

"""Returns a content object that makes up the specified

972

version."""

973

cached_version = parent_texts.get(key, None)

974

if cached_version is not None:

975

# Ensure the cache dict is valid.

976

if not self.get_parent_map([key]):

977

raise RevisionNotPresent(key, self)

978

return cached_version

979

text_map, contents_map = self._get_content_maps([key])

980

return contents_map[key]

981

982

def _get_content_maps(self, keys, nonlocal_keys=None):
    """Produce maps of text and KnitContents

    :param keys: The keys to produce content maps for.
    :param nonlocal_keys: An iterable of keys(possibly intersecting keys)
        which are known to not be in this knit, but rather in one of the
        fallback knits.
    :return: (text_map, content_map) where text_map contains the texts for
        the requested versions and content_map contains the KnitContents.
    :raises RevisionNotPresent: When a local component needed to build a
        key has no record.
    :raises KnitCorrupt: When the sha of a rebuilt text differs from the
        digest recorded for it.
    """
    # FUTURE: This function could be improved for the 'extract many' case
    # by tracking each component and only doing the copy when the number of
    # children than need to apply delta's to it is > 1 or it is part of the
    # final output.
    keys = list(keys)
    multiple_versions = len(keys) != 1
    record_map = self._get_record_map(keys, allow_missing=True)

    text_map = {}
    content_map = {}
    final_content = {}
    if nonlocal_keys is None:
        nonlocal_keys = set()
    else:
        nonlocal_keys = frozenset(nonlocal_keys)

    # Texts known to live elsewhere are fetched as fulltexts from the
    # fallbacks, in order, until none are left to find.
    missing_keys = set(nonlocal_keys)
    for source in self._fallback_vfs:
        if not missing_keys:
            break
        fallback_stream = source.get_record_stream(missing_keys,
            'unordered', True)
        for fallback_record in fallback_stream:
            if fallback_record.storage_kind == 'absent':
                continue
            missing_keys.remove(fallback_record.key)
            lines = split_lines(fallback_record.get_bytes_as('fulltext'))
            text_map[fallback_record.key] = lines
            content_map[fallback_record.key] = PlainKnitContent(lines,
                fallback_record.key)
            if fallback_record.key in keys:
                final_content[fallback_record.key] = \
                    content_map[fallback_record.key]

    for key in keys:
        if key in nonlocal_keys:
            # already handled
            continue
        # Plan: walk back along the compression parents, newest first.
        components = []
        cursor = key
        while cursor is not None:
            try:
                record, record_details, digest, basis = record_map[cursor]
            except KeyError:
                raise RevisionNotPresent(cursor, self)
            components.append((cursor, record, record_details, digest))
            cursor = basis
            if cursor in content_map:
                # no need to plan further back
                components.append((cursor, None, None, None))
                break

        # Build: apply the components oldest first.
        content = None
        for (component_id, record, record_details,
             digest) in reversed(components):
            if component_id in content_map:
                content = content_map[component_id]
            else:
                content, _delta = self._factory.parse_record(key[-1],
                    record, record_details, content,
                    copy_base_content=multiple_versions)
                if multiple_versions:
                    content_map[component_id] = content

        final_content[key] = content

        # digest here is the digest from the last applied component.
        text = content.text()
        actual_sha = sha_strings(text)
        if actual_sha != digest:
            raise KnitCorrupt(self,
                '\n sha-1 %s'
                '\n of reconstructed text does not match'
                '\n expected %s'
                '\n for version %s' %
                (actual_sha, digest, key))
        text_map[key] = text
    return text_map, final_content

1065

1066

def get_parent_map(self, keys):

1067

"""Get a map of the graph parents of keys.

1068

1069

:param keys: The keys to look up parents for.

1070

:return: A mapping from keys to parents. Absent keys are absent from

1071

the mapping.

1072

"""

1073

return self._get_parent_map_with_sources(keys)[0]

1074

1075

def _get_parent_map_with_sources(self, keys):

1076

"""Get a map of the parents of keys.

1077

1078

:param keys: The keys to look up parents for.

1079

:return: A tuple. The first element is a mapping from keys to parents.

1080

Absent keys are absent from the mapping. The second element is a

1081

list with the locations each key was found in. The first element

1082

is the in-this-knit parents, the second the first fallback source,

1083

and so on.

1084

"""

1085

result = {}

1086

sources = [self._index] + self._fallback_vfs

1087

source_results = []

1088

missing = set(keys)

1089

for source in sources:

1090

if not missing:

1091

break

1092

new_result = source.get_parent_map(missing)

1093

source_results.append(new_result)

1094

result.update(new_result)

1095

missing.difference_update(set(new_result))

1096

return result, source_results

1097

1098

def _get_record_map(self, keys, allow_missing=False):
    """Produce a dictionary of knit records.

    :return: {key:(record, record_details, digest, next)}
        record
            data returned from read_records
        record_details
            opaque information to pass to parse_record
        digest
            SHA1 digest of the full text after all steps are done
        next
            build-parent of the version, i.e. the leftmost ancestor.
            Will be None if the record is not a delta.
    :param keys: The keys to build a map for
    :param allow_missing: If some records are missing, rather than
        error, just return the data that could be generated.
    """
    position_map = self._get_components_positions(keys,
        allow_missing=allow_missing)
    # Each position is (record_details, index_memo, next); only the
    # index memo is needed to read the record.
    records = []
    for component_key, position in position_map.iteritems():
        _details, index_memo, _basis = position
        records.append((component_key, index_memo))
    record_map = {}
    for component_key, record, digest in self._read_records_iter(records):
        record_details, _memo, basis = position_map[component_key]
        record_map[component_key] = (record, record_details, digest, basis)
    return record_map

1126

1127

def get_record_stream(self, keys, ordering, include_delta_closure):
    """Get a stream of records for keys.

    :param keys: The keys to include.
    :param ordering: Either 'unordered' or 'topological'. A topologically
        sorted stream has compression parents strictly before their
        children.
    :param include_delta_closure: If True then the closure across any
        compression parents will be included (in the opaque data).
    :return: An iterator of ContentFactory objects, each of which is only
        valid until the iterator is advanced.
    """
    # keys might be a generator
    keys = set(keys)
    if not keys:
        return
    if not self._index.has_graph:
        # Cannot topological order when no graph has been stored.
        ordering = 'unordered'
    if include_delta_closure:
        positions = self._get_components_positions(keys, allow_missing=True)
    else:
        build_details = self._index.get_build_details(keys)
        # map from key to
        # (record_details, access_memo, compression_parent_key)
        positions = {}
        for key, details in build_details.iteritems():
            positions[key] = self._build_details_to_components(details)
    absent_keys = keys.difference(set(positions))
    # There may be more absent keys : if we're missing the basis component
    # and are trying to include the delta closure.
    if include_delta_closure:
        needed_from_fallback = set()
        # Build up reconstructable_keys dict.  key:True in this dict means
        # the key can be reconstructed.
        reconstructable_keys = {}
        for key in keys:
            # the delta chain
            try:
                chain = [key, positions[key][2]]
            except KeyError:
                needed_from_fallback.add(key)
                continue
            result = True
            while chain[-1] is not None:
                basis = chain[-1]
                if basis in reconstructable_keys:
                    result = reconstructable_keys[basis]
                    break
                try:
                    chain.append(positions[basis][2])
                except KeyError:
                    # missing basis component
                    needed_from_fallback.add(basis)
                    result = True
                    break
            for chain_key in chain[:-1]:
                reconstructable_keys[chain_key] = result
            if not result:
                needed_from_fallback.add(key)
    # Double index lookups here : need a unified api ?
    global_map, parent_maps = self._get_parent_map_with_sources(keys)
    if ordering == 'topological':
        # Global topological sort
        present_keys = tsort.topo_sort(global_map)
        # Now group by source:
        source_keys = []
        current_source = None
        for key in present_keys:
            for parent_map in parent_maps:
                if key in parent_map:
                    key_source = parent_map
                    break
            if current_source is not key_source:
                source_keys.append((key_source, []))
                current_source = key_source
            source_keys[-1][1].append(key)
    else:
        if ordering != 'unordered':
            raise AssertionError('valid values for ordering are:'
                ' "unordered" or "topological" not: %r'
                % (ordering,))
        # Just group by source; remote sources first.
        present_keys = []
        source_keys = []
        for parent_map in reversed(parent_maps):
            group = list(parent_map)
            source_keys.append((parent_map, group))
            present_keys.extend(group)
    absent_keys = keys - set(global_map)
    for key in absent_keys:
        yield AbsentContentFactory(key)
    # restrict our view to the keys we can answer.
    # XXX: Memory: TODO: batch data here to cap buffered data at (say) 1MB.
    # XXX: At that point we need to consider the impact of double reads by
    # utilising components multiple times.
    if include_delta_closure:
        # XXX: get_content_maps performs its own index queries; allow state
        # to be passed in.
        text_map, _ = self._get_content_maps(present_keys,
            needed_from_fallback - absent_keys)
        for key in present_keys:
            yield FulltextContentFactory(key, global_map[key], None,
                ''.join(text_map[key]))
    else:
        for source, group_keys in source_keys:
            if source is parent_maps[0]:
                # this KnitVersionedFiles
                records = [(key, positions[key][1]) for key in group_keys]
                raw_records = self._read_records_iter_raw(records)
                for key, raw_data, sha1 in raw_records:
                    (record_details, index_memo, _) = positions[key]
                    yield KnitContentFactory(key, global_map[key],
                        record_details, sha1, raw_data,
                        self._factory.annotated, None)
            else:
                # parent_maps[0] belongs to this knit, so fallback N sits
                # at position N + 1 in parent_maps.
                vf = self._fallback_vfs[parent_maps.index(source) - 1]
                for record in vf.get_record_stream(group_keys, ordering,
                    include_delta_closure):
                    yield record

1245

1246

def get_sha1s(self, keys):
    """See VersionedFiles.get_sha1s().

    Digests recorded locally are used first; keys without a local record
    are then requested from each fallback in turn.

    :return: A dict mapping each key that was found to its sha1.
    """
    missing = set(keys)
    record_map = self._get_record_map(missing, allow_missing=True)
    sha1s = {}
    # record_map may also hold compression parents that were not asked for.
    for key in missing.intersection(record_map):
        # record entry 2 is the 'digest'.
        sha1s[key] = record_map[key][2]
    missing -= set(sha1s)
    for source in self._fallback_vfs:
        if not missing:
            break
        fallback_sha1s = source.get_sha1s(missing)
        sha1s.update(fallback_sha1s)
        missing -= set(fallback_sha1s)
    return sha1s

1264

1265

def insert_record_stream(self, stream):

1266

"""Insert a record stream into this container.

1267

1268

:param stream: A stream of records to insert.

1269

:return: None

1270

:seealso VersionedFiles.get_record_stream:

1271

"""

1272

def get_adapter(adapter_key):

1273

try:

1274

return adapters[adapter_key]

1275

except KeyError:

1276

adapter_factory = adapter_registry.get(adapter_key)

1277

adapter = adapter_factory(self)

1278

adapters[adapter_key] = adapter

1279

return adapter

1280

if self._factory.annotated:

1281

# self is annotated, we need annotated knits to use directly.

1282

annotated = "annotated-"

1283

convertibles = []

1284

else:

1285

# self is not annotated, but we can strip annotations cheaply.

1286

annotated = ""

1287

convertibles = set(["knit-annotated-ft-gz"])

1288

if self._max_delta_chain:

1289

convertibles.add("knit-annotated-delta-gz")

1290

# The set of types we can cheaply adapt without needing basis texts.

1291

native_types = set()

1292

if self._max_delta_chain:

1293

native_types.add("knit-%sdelta-gz" % annotated)

1294

native_types.add("knit-%sft-gz" % annotated)

1295

knit_types = native_types.union(convertibles)

1296

adapters = {}

1297

# Buffer all index entries that we can't add immediately because their

1298

# basis parent is missing. We don't buffer all because generating

1299

# annotations may require access to some of the new records. However we

1300

# can't generate annotations from new deltas until their basis parent

1301

# is present anyway, so we get away with not needing an index that

1302

# includes the new keys.

1303

# key = basis_parent, value = index entry to add

1304

buffered_index_entries = {}

1305

for record in stream:

1306

parents = record.parents

1307

# Raise an error when a record is missing.

1308

if record.storage_kind == 'absent':

1309

raise RevisionNotPresent([record.key], self)

1310

if record.storage_kind in knit_types:

1311

if record.storage_kind not in native_types:

1312

try:

1313

adapter_key = (record.storage_kind, "knit-delta-gz")

1314

adapter = get_adapter(adapter_key)

1315

except KeyError:

1316

adapter_key = (record.storage_kind, "knit-ft-gz")

1317

adapter = get_adapter(adapter_key)

1318

bytes = adapter.get_bytes(

1319

record, record.get_bytes_as(record.storage_kind))

1320

else:

1321

bytes = record.get_bytes_as(record.storage_kind)

1322

options = [record._build_details[0]]

1323

if record._build_details[1]:

1324

options.append('no-eol')

1325

# Just blat it across.

1326

# Note: This does end up adding data on duplicate keys. As

1327

# modern repositories use atomic insertions this should not

1328

# lead to excessive growth in the event of interrupted fetches.

1329

# 'knit' repositories may suffer excessive growth, but as a

1330

# deprecated format this is tolerable. It can be fixed if

1331

# needed by in the kndx index support raising on a duplicate

1332

# add with identical parents and options.

1333

access_memo = self._access.add_raw_records(

1334

[(record.key, len(bytes))], bytes)[0]

1335

index_entry = (record.key, options, access_memo, parents)

1336

buffered = False

1337

if 'fulltext' not in options:

1338

basis_parent = parents[0]

1339

# Note that pack backed knits don't need to buffer here

1340

# because they buffer all writes to the transaction level,

1341

# but we don't expose that difference at the index level. If

1342

# the query here has sufficient cost to show up in

1343

# profiling we should do that.

1344

if basis_parent not in self.get_parent_map([basis_parent]):

1345

pending = buffered_index_entries.setdefault(

1346

basis_parent, [])

1347

pending.append(index_entry)

1348

buffered = True

1349

if not buffered:

1350

self._index.add_records([index_entry])

1351

elif record.storage_kind == 'fulltext':

1352

self.add_lines(record.key, parents,

1353

split_lines(record.get_bytes_as('fulltext')))

1354

else:

1355

adapter_key = record.storage_kind, 'fulltext'

1356

adapter = get_adapter(adapter_key)

1357

lines = split_lines(adapter.get_bytes(

1358

record, record.get_bytes_as(record.storage_kind)))

1359

try:

1360

self.add_lines(record.key, parents, lines)

1361

except errors.RevisionAlreadyPresent:

1362

pass

1363

# Add any records whose basis parent is now available.

1364

added_keys = [record.key]

1365

while added_keys:

1366

key = added_keys.pop(0)

1367

if key in buffered_index_entries:

1368

index_entries = buffered_index_entries[key]

1369

self._index.add_records(index_entries)

1370

added_keys.extend(

1371

[index_entry[0] for index_entry in index_entries])

1372

del buffered_index_entries[key]

1373

# If there were any deltas which had a missing basis parent, error.

1374

if buffered_index_entries:

1375

raise errors.RevisionNotPresent(buffered_index_entries.keys()[0],

1376

self)

1377

1378

def iter_lines_added_or_present_in_keys(self, keys, pb=None):
    """Iterate over the lines in the versioned files from keys.

    This may return lines from other keys. Each item the returned
    iterator yields is a tuple of a line and a text version that that line
    is present in (not introduced in).

    Ordering of results is in whatever order is most suitable for the
    underlying storage format.

    If a progress bar is supplied, it may be used to indicate progress.
    The caller is responsible for cleaning up progress bars (because this
    is an iterator).

    NOTES:
     * Lines are normalised by the underlying store: they will all have \n
       terminators.
     * Lines are returned in arbitrary order.

    :return: An iterator over (line, key).
    :raises RevisionNotPresent: After all available lines were yielded,
        when some keys were found neither here nor in any fallback.
    """
    if pb is None:
        pb = progress.DummyProgress()
    keys = set(keys)
    total = len(keys)
    # we don't care about inclusions, the caller cares.
    # but we need to setup a list of records to visit.
    # we need key, position, length
    key_records = []
    build_details = self._index.get_build_details(keys)
    for key, details in build_details.iteritems():
        if key in keys:
            key_records.append((key, details[0]))
            # What is left in keys afterwards is wanted from the fallbacks.
            keys.remove(key)
    records_iter = enumerate(self._read_records_iter(key_records))
    for (key_idx, (key, data, sha_value)) in records_iter:
        pb.update('Walking content.', key_idx, total)
        compression_parent = build_details[key][1]
        if compression_parent is None:
            # fulltext
            line_iterator = self._factory.get_fulltext_content(data)
        else:
            # Delta
            line_iterator = self._factory.get_linedelta_content(data)
        # XXX: It might be more efficient to yield (key,
        # line_iterator) in the future. However for now, this is a simpler
        # change to integrate into the rest of the codebase. RBC 20071110
        for line in line_iterator:
            yield line, key
    for source in self._fallback_vfs:
        if not keys:
            break
        source_keys = set()
        for line, key in source.iter_lines_added_or_present_in_keys(keys):
            source_keys.add(key)
            yield line, key
        keys.difference_update(source_keys)
    if keys:
        # Pass self, as the other RevisionNotPresent raise sites in this
        # class do; __init__ sets no 'filename' attribute.
        raise RevisionNotPresent(keys, self)
    pb.update('Walking content.', total, total)

1438

1439

def _make_line_delta(self, delta_seq, new_content):

1440

"""Generate a line delta from delta_seq and new_content."""

1441

diff_hunks = []

1442

for op in delta_seq.get_opcodes():

1443

if op[0] == 'equal':

1444

continue

1445

diff_hunks.append((op[1], op[2], op[4]-op[3], new_content._lines[op[3]:op[4]]))

1446

return diff_hunks

1447

1448

def _merge_annotations(self, content, parents, parent_texts={},

1449

delta=None, annotated=None,

1450

left_matching_blocks=None):

1451

"""Merge annotations for content and generate deltas.

1452

1453

This is done by comparing the annotations based on changes to the text

1454

and generating a delta on the resulting full texts. If annotations are

1455

not being created then a simple delta is created.

1456

"""

1457

if left_matching_blocks is not None:

1458

delta_seq = diff._PrematchedMatcher(left_matching_blocks)

1459

else:

1460

delta_seq = None

1461

if annotated:

1462

for parent_key in parents:

1463

merge_content = self._get_content(parent_key, parent_texts)

1464

if (parent_key == parents[0] and delta_seq is not None):

1465

seq = delta_seq

1466

else:

1467

seq = patiencediff.PatienceSequenceMatcher(

1468

None, merge_content.text(), content.text())

1469

for i, j, n in seq.get_matching_blocks():

1470

if n == 0:

1471

continue

1472

# this copies (origin, text) pairs across to the new

1473

# content for any line that matches the last-checked

1474

# parent.

1475

content._lines[j:j+n] = merge_content._lines[i:i+n]

1476

# XXX: Robert says the following block is a workaround for a

1477

# now-fixed bug and it can probably be deleted. -- mbp 20080618

1478

if content._lines and content._lines[-1][1][-1] != '\n':

1479

# The copied annotation was from a line without a trailing EOL,

1480

# reinstate one for the content object, to ensure correct

1481

# serialization.

1482

line = content._lines[-1][1] + '\n'

1483

content._lines[-1] = (content._lines[-1][0], line)

1484

if delta:

1485

if delta_seq is None:

1486

reference_content = self._get_content(parents[0], parent_texts)

1487

new_texts = content.text()

1488

old_texts = reference_content.text()

1489

delta_seq = patiencediff.PatienceSequenceMatcher(

1490

None, old_texts, new_texts)

1491

return self._make_line_delta(delta_seq, content)

1492

1493

def _parse_record(self, version_id, data):

1494

"""Parse an original format knit record.

1495

1496

These have the last element of the key only present in the stored data.

1497

"""

1498

rec, record_contents = self._parse_record_unchecked(data)

1499

self._check_header_version(rec, version_id)

1500

return record_contents, rec[3]

1501

1502

def _parse_record_header(self, key, raw_data):

1503

"""Parse a record header for consistency.

1504

1505

:return: the header and the decompressor stream.

1506

as (stream, header_record)

1507

"""

1508

df = tuned_gzip.GzipFile(mode='rb', fileobj=StringIO(raw_data))

1509

try:

1510

# Current serialise

1511

rec = self._check_header(key, df.readline())

1512

except Exception, e:

1513

raise KnitCorrupt(self,

1514

"While reading {%s} got %s(%s)"

1515

% (key, e.__class__.__name__, str(e)))

1516

return df, rec

1517

1518

def _parse_record_unchecked(self, data):

1519

# profiling notes:

1520

# 4168 calls in 2880 217 internal

1521

# 4168 calls to _parse_record_header in 2121

1522

# 4168 calls to readlines in 330

1523

df = tuned_gzip.GzipFile(mode='rb', fileobj=StringIO(data))

1524

try:

1525

record_contents = df.readlines()

1526

except Exception, e:

1527

raise KnitCorrupt(self, "Corrupt compressed record %r, got %s(%s)" %

1528

(data, e.__class__.__name__, str(e)))

1529

header = record_contents.pop(0)

1530

rec = self._split_header(header)

1531

last_line = record_contents.pop()

1532

if len(record_contents) != int(rec[2]):

1533

raise KnitCorrupt(self,

1534

'incorrect number of lines %s != %s'

1535

' for version {%s} %s'

1536

% (len(record_contents), int(rec[2]),

1537

rec[1], record_contents))

1538

if last_line != 'end %s\n' % rec[1]:

1539

raise KnitCorrupt(self,

1540

'unexpected version end line %r, wanted %r'

1541

% (last_line, rec[1]))

1542

df.close()

1543

return rec, record_contents

1544

1545

def _read_records_iter(self, records):

1546

"""Read text records from data file and yield result.

1547

1548

The result will be returned in whatever is the fastest to read.

1549

Not by the order requested. Also, multiple requests for the same

1550

record will only yield 1 response.

1551

:param records: A list of (key, access_memo) entries

1552

:return: Yields (key, contents, digest) in the order

1553

read, not the order requested

1554

"""

1555

if not records:

1556

return

1557

1558

# XXX: This smells wrong, IO may not be getting ordered right.

1559

needed_records = sorted(set(records), key=operator.itemgetter(1))

1560

if not needed_records:

1561

return

1562

1563

# The transport optimizes the fetching as well

1564

# (ie, reads continuous ranges.)

1565

raw_data = self._access.get_raw_records(

1566

[index_memo for key, index_memo in needed_records])

1567

1568

for (key, index_memo), data in \

1569

izip(iter(needed_records), raw_data):

1570

content, digest = self._parse_record(key[-1], data)

1571

yield key, content, digest

1572

1573

def _read_records_iter_raw(self, records):

1574

"""Read text records from data file and yield raw data.

1575

1576

This unpacks enough of the text record to validate the id is

1577

as expected but thats all.

1578

1579

Each item the iterator yields is (key, bytes, sha1_of_full_text).

1580

"""

1581

# setup an iterator of the external records:

1582

# uses readv so nice and fast we hope.

1583

if len(records):

1584

# grab the disk data needed.

1585

needed_offsets = [index_memo for key, index_memo

1586

in records]

1587

raw_records = self._access.get_raw_records(needed_offsets)

1588

1589

for key, index_memo in records:

1590

data = raw_records.next()

1591

# validate the header (note that we can only use the suffix in

1592

# current knit records).

1593

df, rec = self._parse_record_header(key, data)

1594

df.close()

1595

yield key, data, rec[3]

1596

1597

def _record_to_data(self, key, digest, lines, dense_lines=None):

1598

"""Convert key, digest, lines into a raw data block.

1599

1600

:param key: The key of the record. Currently keys are always serialised

1601

using just the trailing component.

1602

:param dense_lines: The bytes of lines but in a denser form. For

1603

instance, if lines is a list of 1000 bytestrings each ending in \n,

1604

dense_lines may be a list with one line in it, containing all the

1605

1000's lines and their \n's. Using dense_lines if it is already

1606

known is a win because the string join to create bytes in this

1607

function spends less time resizing the final string.

1608

:return: (len, a StringIO instance with the raw data ready to read.)

1609

"""

1610

# Note: using a string copy here increases memory pressure with e.g.

1611

# ISO's, but it is about 3 seconds faster on a 1.2Ghz intel machine

1612

# when doing the initial commit of a mozilla tree. RBC 20070921

1613

bytes = ''.join(chain(

1614

["version %s %d %s\n" % (key[-1],

1615

len(lines),

1616

digest)],

1617

dense_lines or lines,

1618

["end %s\n" % key[-1]]))

1619

if type(bytes) != str:

1620

raise AssertionError(

1621

'data must be plain bytes was %s' % type(bytes))

1622

if lines and lines[-1][-1] != '\n':

1623

raise ValueError('corrupt lines value %r' % lines)

1624

compressed_bytes = tuned_gzip.bytes_to_gzip(bytes)

1625

return len(compressed_bytes), compressed_bytes

1626

1627

def _split_header(self, line):

1628

rec = line.split()

1629

if len(rec) != 4:

1630

raise KnitCorrupt(self,

1631

'unexpected number of elements in record header')

1632

return rec

1633

1634

def keys(self):
    """See VersionedFiles.keys.

    :return: A set holding the union of the keys reported by this object's
        index and by each of its fallback versioned files.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(2, "keys scales with size of history")
    all_keys = set()
    for source in [self._index] + self._fallback_vfs:
        all_keys.update(source.keys())
    return all_keys

1643

1644

1645

1646

class _KndxIndex(object):

1647

"""Manages knit index files

1648

1649

The index is kept in memory and read on startup, to enable

1650

fast lookups of revision information. The cursor of the index

1651

file is always pointing to the end, making it easy to append

1652

entries.

1653

1654

_cache is a cache for fast mapping from version id to a Index

1655

object.

1656

1657

_history is a cache for fast mapping from indexes to version ids.

1658

1659

The index data format is dictionary compressed when it comes to

1660

parent references; a index entry may only have parents that with a

1661

lover index number. As a result, the index is topological sorted.

1662

1663

Duplicate entries may be written to the index for a single version id

1664

if this is done then the latter one completely replaces the former:

1665

this allows updates to correct version and parent information.

1666

Note that the two entries may share the delta, and that successive

1667

annotations and references MUST point to the first entry.

1668

1669

The index file on disc contains a header, followed by one line per knit

1670

record. The same revision can be present in an index file more than once.

1671

The first occurrence gets assigned a sequence number starting from 0.

1672

1673

The format of a single line is

1674

REVISION_ID FLAGS BYTE_OFFSET LENGTH( PARENT_ID|PARENT_SEQUENCE_ID)* :\n

1675

REVISION_ID is a utf8-encoded revision id

1676

FLAGS is a comma separated list of flags about the record. Values include

1677

no-eol, line-delta, fulltext.

1678

BYTE_OFFSET is the ascii representation of the byte offset in the data file

1679

that the the compressed data starts at.

1680

LENGTH is the ascii representation of the length of the data file.

1681

PARENT_ID a utf-8 revision id prefixed by a '.' that is a parent of

1682

REVISION_ID.

1683

PARENT_SEQUENCE_ID the ascii representation of the sequence number of a

1684

revision id already in the knit that is a parent of REVISION_ID.

1685

The ' :' marker is the end of record marker.

1686

1687

partial writes:

1688

when a write is interrupted to the index file, it will result in a line

1689

that does not end in ' :'. If the ' :' is not present at the end of a line,

1690

or at the end of the file, then the record that is missing it will be

1691

ignored by the parser.

1692

1693

When writing new records to the index file, the data is preceded by '\n'

1694

to ensure that records always start on new lines even if the last write was

1695

interrupted. As a result its normal for the last line in the index to be

1696

missing a trailing newline. One can be added with no harmful effects.

1697

1698

:ivar _kndx_cache: dict from prefix to the old state of KnitIndex objects,

1699

where prefix is e.g. the (fileid,) for .texts instances or () for

1700

constant-mapped things like .revisions, and the old state is

1701

tuple(history_vector, cache_dict). This is used to prevent having an

1702

ABI change with the C extension that reads .kndx files.

1703

"""

1704

1705

HEADER = "# bzr knit index 8\n"

1706

1707

def __init__(self, transport, mapper, get_scope, allow_writes, is_locked):

1708

"""Create a _KndxIndex on transport using mapper."""

1709

self._transport = transport

1710

self._mapper = mapper

1711

self._get_scope = get_scope

1712

self._allow_writes = allow_writes

1713

self._is_locked = is_locked

1714

self._reset_cache()

1715

self.has_graph = True

1716

1717

def add_records(self, records, random_id=False):

1718

"""Add multiple records to the index.

1719

1720

:param records: a list of tuples:

1721

(key, options, access_memo, parents).

1722

:param random_id: If True the ids being added were randomly generated

1723

and no check for existence will be performed.

1724

"""

1725

paths = {}

1726

for record in records:

1727

key = record[0]

1728

prefix = key[:-1]

1729

path = self._mapper.map(key) + '.kndx'

1730

path_keys = paths.setdefault(path, (prefix, []))

1731

path_keys[1].append(record)

1732

for path in sorted(paths):

1733

prefix, path_keys = paths[path]

1734

self._load_prefixes([prefix])

1735

lines = []

1736

orig_history = self._kndx_cache[prefix][1][:]

1737

orig_cache = self._kndx_cache[prefix][0].copy()

1738

1739

try:

1740

for key, options, (_, pos, size), parents in path_keys:

1741

if parents is None:

1742

# kndx indices cannot be parentless.

1743

parents = ()

1744

line = "\n%s %s %s %s %s :" % (

1745

key[-1], ','.join(options), pos, size,

1746

self._dictionary_compress(parents))

1747

if type(line) != str:

1748

raise AssertionError(

1749

'data must be utf8 was %s' % type(line))

1750

lines.append(line)

1751

self._cache_key(key, options, pos, size, parents)

1752

if len(orig_history):

1753

self._transport.append_bytes(path, ''.join(lines))

1754

else:

1755

self._init_index(path, lines)

1756

except:

1757

# If any problems happen, restore the original values and re-raise

1758

self._kndx_cache[prefix] = (orig_cache, orig_history)

1759

raise

1760

1761

def _cache_key(self, key, options, pos, size, parent_keys):

1762

"""Cache a version record in the history array and index cache.

1763

1764

This is inlined into _load_data for performance. KEEP IN SYNC.

1765

(It saves 60ms, 25% of the __init__ overhead on local 4000 record

1766

indexes).

1767

"""

1768

prefix = key[:-1]

1769

version_id = key[-1]

1770

# last-element only for compatibilty with the C load_data.

1771

parents = tuple(parent[-1] for parent in parent_keys)

1772

for parent in parent_keys:

1773

if parent[:-1] != prefix:

1774

raise ValueError("mismatched prefixes for %r, %r" % (

1775

key, parent_keys))

1776

cache, history = self._kndx_cache[prefix]

1777

# only want the _history index to reference the 1st index entry

1778

# for version_id

1779

if version_id not in cache:

1780

index = len(history)

1781

history.append(version_id)

1782

else:

1783

index = cache[version_id][5]

1784

cache[version_id] = (version_id,

1785

options,

1786

pos,

1787

size,

1788

parents,

1789

index)

1790

1791

def check_header(self, fp):

1792

line = fp.readline()

1793

if line == '':

1794

# An empty file can actually be treated as though the file doesn't

1795

# exist yet.

1796

raise errors.NoSuchFile(self)

1797

if line != self.HEADER:

1798

raise KnitHeaderError(badline=line, filename=self)

1799

1800

def _check_read(self):

1801

if not self._is_locked():

1802

raise errors.ObjectNotLocked(self)

1803

if self._get_scope() != self._scope:

1804

self._reset_cache()

1805

1806

def _check_write_ok(self):

1807

"""Assert if not writes are permitted."""

1808

if not self._is_locked():

1809

raise errors.ObjectNotLocked(self)

1810

if self._get_scope() != self._scope:

1811

self._reset_cache()

1812

if self._mode != 'w':

1813

raise errors.ReadOnlyObjectDirtiedError(self)

1814

1815

def get_build_details(self, keys):

1816

"""Get the method, index_memo and compression parent for keys.

1817

1818

Ghosts are omitted from the result.

1819

1820

:param keys: An iterable of keys.

1821

:return: A dict of key:(index_memo, compression_parent, parents,

1822

record_details).

1823

index_memo

1824

opaque structure to pass to read_records to extract the raw

1825

data

1826

compression_parent

1827

Content that this record is built upon, may be None

1828

parents

1829

Logical parents of this node

1830

record_details

1831

extra information about the content which needs to be passed to

1832

Factory.parse_record

1833

"""

1834

prefixes = self._partition_keys(keys)

1835

parent_map = self.get_parent_map(keys)

1836

result = {}

1837

for key in keys:

1838

if key not in parent_map:

1839

continue # Ghost

1840

method = self.get_method(key)

1841

parents = parent_map[key]

1842

if method == 'fulltext':

1843

compression_parent = None

1844

else:

1845

compression_parent = parents[0]

1846

noeol = 'no-eol' in self.get_options(key)

1847

index_memo = self.get_position(key)

1848

result[key] = (index_memo, compression_parent,

1849

parents, (method, noeol))

1850

return result

1851

1852

def get_method(self, key):

1853

"""Return compression method of specified key."""

1854

options = self.get_options(key)

1855

if 'fulltext' in options:

1856

return 'fulltext'

1857

elif 'line-delta' in options:

1858

return 'line-delta'

1859

else:

1860

raise errors.KnitIndexUnknownMethod(self, options)

1861

1862

def get_options(self, key):

1863

"""Return a list representing options.

1864

1865

e.g. ['foo', 'bar']

1866

"""

1867

prefix, suffix = self._split_key(key)

1868

self._load_prefixes([prefix])

1869

try:

1870

return self._kndx_cache[prefix][0][suffix][1]

1871

except KeyError:

1872

raise RevisionNotPresent(key, self)

1873

1874

def get_parent_map(self, keys):

1875

"""Get a map of the parents of keys.

1876

1877

:param keys: The keys to look up parents for.

1878

:return: A mapping from keys to parents. Absent keys are absent from

1879

the mapping.

1880

"""

1881

# Parse what we need to up front, this potentially trades off I/O

1882

# locality (.kndx and .knit in the same block group for the same file

1883

# id) for less checking in inner loops.

1884

prefixes = set(key[:-1] for key in keys)

1885

self._load_prefixes(prefixes)

1886

result = {}

1887

for key in keys:

1888

prefix = key[:-1]

1889

try:

1890

suffix_parents = self._kndx_cache[prefix][0][key[-1]][4]

1891

except KeyError:

1892

pass

1893

else:

1894

result[key] = tuple(prefix + (suffix,) for

1895

suffix in suffix_parents)

1896

return result

1897

1898

def get_position(self, key):

1899

"""Return details needed to access the version.

1900

1901

:return: a tuple (key, data position, size) to hand to the access

1902

logic to get the record.

1903

"""

1904

prefix, suffix = self._split_key(key)

1905

self._load_prefixes([prefix])

1906

entry = self._kndx_cache[prefix][0][suffix]

1907

return key, entry[2], entry[3]

1908

1909

def _init_index(self, path, extra_lines=[]):

1910

"""Initialize an index."""

1911

sio = StringIO()

1912

sio.write(self.HEADER)

1913

sio.writelines(extra_lines)

1914

sio.seek(0)

1915

self._transport.put_file_non_atomic(path, sio,

1916

create_parent_dir=True)

1917

# self._create_parent_dir)

1918

# mode=self._file_mode,

1919

# dir_mode=self._dir_mode)

1920

1921

def keys(self):

1922

"""Get all the keys in the collection.

1923

1924

The keys are not ordered.

1925

"""

1926

result = set()

1927

# Identify all key prefixes.

1928

# XXX: A bit hacky, needs polish.

1929

if type(self._mapper) == ConstantMapper:

1930

prefixes = [()]

1931

else:

1932

relpaths = set()

1933

for quoted_relpath in self._transport.iter_files_recursive():

1934

path, ext = os.path.splitext(quoted_relpath)

1935

relpaths.add(path)

1936

prefixes = [self._mapper.unmap(path) for path in relpaths]

1937

self._load_prefixes(prefixes)

1938

for prefix in prefixes:

1939

for suffix in self._kndx_cache[prefix][1]:

1940

result.add(prefix + (suffix,))

1941

return result

1942

1943

def _load_prefixes(self, prefixes):

1944

"""Load the indices for prefixes."""

1945

self._check_read()

1946

for prefix in prefixes:

1947

if prefix not in self._kndx_cache:

1948

# the load_data interface writes to these variables.

1949

self._cache = {}

1950

self._history = []

1951

self._filename = prefix

1952

try:

1953

path = self._mapper.map(prefix) + '.kndx'

1954

fp = self._transport.get(path)

1955

try:

1956

# _load_data may raise NoSuchFile if the target knit is

1957

# completely empty.

1958

_load_data(self, fp)

1959

finally:

1960

fp.close()

1961

self._kndx_cache[prefix] = (self._cache, self._history)

1962

del self._cache

1963

del self._filename

1964

del self._history

1965

except NoSuchFile:

1966

self._kndx_cache[prefix] = ({}, [])

1967

if type(self._mapper) == ConstantMapper:

1968

# preserve behaviour for revisions.kndx etc.

1969

self._init_index(path)

1970

del self._cache

1971

del self._filename

1972

del self._history

1973

1974

def _partition_keys(self, keys):

1975

"""Turn keys into a dict of prefix:suffix_list."""

1976

result = {}

1977

for key in keys:

1978

prefix_keys = result.setdefault(key[:-1], [])

1979

prefix_keys.append(key[-1])

1980

return result

1981

1982

def _dictionary_compress(self, keys):

1983

"""Dictionary compress keys.

1984

1985

:param keys: The keys to generate references to.

1986

:return: A string representation of keys. keys which are present are

1987

dictionary compressed, and others are emitted as fulltext with a

1988

'.' prefix.

1989

"""

1990

if not keys:

1991

return ''

1992

result_list = []

1993

prefix = keys[0][:-1]

1994

cache = self._kndx_cache[prefix][0]

1995

for key in keys:

1996

if key[:-1] != prefix:

1997

# kndx indices cannot refer across partitioned storage.

1998

raise ValueError("mismatched prefixes for %r" % keys)

1999

if key[-1] in cache:

2000

# -- inlined lookup() --

2001

result_list.append(str(cache[key[-1]][5]))

2002

# -- end lookup () --

2003

else:

2004

result_list.append('.' + key[-1])

2005

return ' '.join(result_list)

2006

2007

def _reset_cache(self):

2008

# Possibly this should be a LRU cache. A dictionary from key_prefix to

2009

# (cache_dict, history_vector) for parsed kndx files.

2010

self._kndx_cache = {}

2011

self._scope = self._get_scope()

2012

allow_writes = self._allow_writes()

2013

if allow_writes:

2014

self._mode = 'w'

2015

else:

2016

self._mode = 'r'

2017

2018

def _split_key(self, key):

2019

"""Split key into a prefix and suffix."""

2020

return key[:-1], key[-1]

2021

2022

2023

class _KnitGraphIndex(object):

2024

"""A KnitVersionedFiles index layered on GraphIndex."""

2025

2026

def __init__(self, graph_index, is_locked, deltas=False, parents=True,

2027

add_callback=None):

2028

"""Construct a KnitGraphIndex on a graph_index.

2029

2030

:param graph_index: An implementation of bzrlib.index.GraphIndex.

2031

:param is_locked: A callback to check whether the object should answer

2032

queries.

2033

:param deltas: Allow delta-compressed records.

2034

:param parents: If True, record knits parents, if not do not record

2035

parents.

2036

:param add_callback: If not None, allow additions to the index and call

2037

this callback with a list of added GraphIndex nodes:

2038

[(node, value, node_refs), ...]

2039

:param is_locked: A callback, returns True if the index is locked and

2040

thus usable.

2041

"""

2042

self._add_callback = add_callback

2043

self._graph_index = graph_index

2044

self._deltas = deltas

2045

self._parents = parents

2046

if deltas and not parents:

2047

# XXX: TODO: Delta tree and parent graph should be conceptually

2048

# separate.

2049

raise KnitCorrupt(self, "Cannot do delta compression without "

2050

"parent tracking.")

2051

self.has_graph = parents

2052

self._is_locked = is_locked

2053

2054

def __repr__(self):

2055

return "%s(%r)" % (self.__class__.__name__, self._graph_index)

2056

2057

def add_records(self, records, random_id=False):

2058

"""Add multiple records to the index.

2059

2060

This function does not insert data into the Immutable GraphIndex

2061

backing the KnitGraphIndex, instead it prepares data for insertion by

2062

the caller and checks that it is safe to insert then calls

2063

self._add_callback with the prepared GraphIndex nodes.

2064

2065

:param records: a list of tuples:

2066

(key, options, access_memo, parents).

2067

:param random_id: If True the ids being added were randomly generated

2068

and no check for existence will be performed.

2069

"""

2070

if not self._add_callback:

2071

raise errors.ReadOnlyError(self)

2072

# we hope there are no repositories with inconsistent parentage

2073

# anymore.

2074

2075

keys = {}

2076

for (key, options, access_memo, parents) in records:

2077

if self._parents:

2078

parents = tuple(parents)

2079

index, pos, size = access_memo

2080

if 'no-eol' in options:

2081

value = 'N'

2082

else:

2083

value = ' '

2084

value += "%d %d" % (pos, size)

2085

if not self._deltas:

2086

if 'line-delta' in options:

2087

raise KnitCorrupt(self, "attempt to add line-delta in non-delta knit")

2088

if self._parents:

2089

if self._deltas:

2090

if 'line-delta' in options:

2091

node_refs = (parents, (parents[0],))

2092

else:

2093

node_refs = (parents, ())

2094

else:

2095

node_refs = (parents, )

2096

else:

2097

if parents:

2098

raise KnitCorrupt(self, "attempt to add node with parents "

2099

"in parentless index.")

2100

node_refs = ()

2101

keys[key] = (value, node_refs)

2102

# check for dups

2103

if not random_id:

2104

present_nodes = self._get_entries(keys)

2105

for (index, key, value, node_refs) in present_nodes:

2106

if (value[0] != keys[key][0][0] or

2107

node_refs != keys[key][1]):

2108

raise KnitCorrupt(self, "inconsistent details in add_records"

2109

": %s %s" % ((value, node_refs), keys[key]))

2110

del keys[key]

2111

result = []

2112

if self._parents:

2113

for key, (value, node_refs) in keys.iteritems():

2114

result.append((key, value, node_refs))

2115

else:

2116

for key, (value, node_refs) in keys.iteritems():

2117

result.append((key, value))

2118

self._add_callback(result)

2119

2120

def _check_read(self):

2121

"""raise if reads are not permitted."""

2122

if not self._is_locked():

2123

raise errors.ObjectNotLocked(self)

2124

2125

def _check_write_ok(self):

2126

"""Assert if writes are not permitted."""

2127

if not self._is_locked():

2128

raise errors.ObjectNotLocked(self)

2129

2130

def _compression_parent(self, an_entry):

2131

# return the key that an_entry is compressed against, or None

2132

# Grab the second parent list (as deltas implies parents currently)

2133

compression_parents = an_entry[3][1]

2134

if not compression_parents:

2135

return None

2136

if len(compression_parents) != 1:

2137

raise AssertionError(

2138

"Too many compression parents: %r" % compression_parents)

2139

return compression_parents[0]

2140

2141

def get_build_details(self, keys):

2142

"""Get the method, index_memo and compression parent for version_ids.

2143

2144

Ghosts are omitted from the result.

2145

2146

:param keys: An iterable of keys.

2147

:return: A dict of key:

2148

(index_memo, compression_parent, parents, record_details).

2149

index_memo

2150

opaque structure to pass to read_records to extract the raw

2151

data

2152

compression_parent

2153

Content that this record is built upon, may be None

2154

parents

2155

Logical parents of this node

2156

record_details

2157

extra information about the content which needs to be passed to

2158

Factory.parse_record

2159

"""

2160

self._check_read()

2161

result = {}

2162

entries = self._get_entries(keys, False)

2163

for entry in entries:

2164

key = entry[1]

2165

if not self._parents:

2166

parents = ()

2167

else:

2168

parents = entry[3][0]

2169

if not self._deltas:

2170

compression_parent_key = None

2171

else:

2172

compression_parent_key = self._compression_parent(entry)

2173

noeol = (entry[2][0] == 'N')

2174

if compression_parent_key:

2175

method = 'line-delta'

2176

else:

2177

method = 'fulltext'

2178

result[key] = (self._node_to_position(entry),

2179

compression_parent_key, parents,

2180

(method, noeol))

2181

return result

2182

2183

def _get_entries(self, keys, check_present=False):

2184

"""Get the entries for keys.

2185

2186

:param keys: An iterable of index key tuples.

2187

"""

2188

keys = set(keys)

2189

found_keys = set()

2190

if self._parents:

2191

for node in self._graph_index.iter_entries(keys):

2192

yield node

2193

found_keys.add(node[1])

2194

else:

2195

# adapt parentless index to the rest of the code.

2196

for node in self._graph_index.iter_entries(keys):

2197

yield node[0], node[1], node[2], ()

2198

found_keys.add(node[1])

2199

if check_present:

2200

missing_keys = keys.difference(found_keys)

2201

if missing_keys:

2202

raise RevisionNotPresent(missing_keys.pop(), self)

2203

2204

def get_method(self, key):

2205

"""Return compression method of specified key."""

2206

return self._get_method(self._get_node(key))

2207

2208

def _get_method(self, node):

2209

if not self._deltas:

2210

return 'fulltext'

2211

if self._compression_parent(node):

2212

return 'line-delta'

2213

else:

2214

return 'fulltext'

2215

2216

def _get_node(self, key):

2217

try:

2218

return list(self._get_entries([key]))[0]

2219

except IndexError:

2220

raise RevisionNotPresent(key, self)

2221

2222

def get_options(self, key):

2223

"""Return a list representing options.

2224

2225

e.g. ['foo', 'bar']

2226

"""

2227

node = self._get_node(key)

2228

options = [self._get_method(node)]

2229

if node[2][0] == 'N':

2230

options.append('no-eol')

2231

return options

2232

2233

def get_parent_map(self, keys):

2234

"""Get a map of the parents of keys.

2235

2236

:param keys: The keys to look up parents for.

2237

:return: A mapping from keys to parents. Absent keys are absent from

2238

the mapping.

2239

"""

2240

self._check_read()

2241

nodes = self._get_entries(keys)

2242

result = {}

2243

if self._parents:

2244

for node in nodes:

2245

result[node[1]] = node[3][0]

2246

else:

2247

for node in nodes:

2248

result[node[1]] = None

2249

return result

2250

2251

def get_position(self, key):

2252

"""Return details needed to access the version.

2253

2254

:return: a tuple (index, data position, size) to hand to the access

2255

logic to get the record.

2256

"""

2257

node = self._get_node(key)

2258

return self._node_to_position(node)

2259

2260

def keys(self):

2261

"""Get all the keys in the collection.

2262

2263

The keys are not ordered.

2264

"""

2265

self._check_read()

2266

return [node[1] for node in self._graph_index.iter_all_entries()]

2267

2268

def _node_to_position(self, node):

2269

"""Convert an index value to position details."""

2270

bits = node[2][1:].split(' ')

2271

return node[0], int(bits[0]), int(bits[1])

2272

2273

2274

class _KnitKeyAccess(object):

2275

"""Access to records in .knit files."""

2276

2277

def __init__(self, transport, mapper):

2278

"""Create a _KnitKeyAccess with transport and mapper.

2279

2280

:param transport: The transport the access object is rooted at.

2281

:param mapper: The mapper used to map keys to .knit files.

2282

"""

2283

self._transport = transport

2284

self._mapper = mapper

2285

2286

def add_raw_records(self, key_sizes, raw_data):

2287

"""Add raw knit bytes to a storage area.

2288

2289

The data is spooled to the container writer in one bytes-record per

2290

raw data item.

2291

2292

:param sizes: An iterable of tuples containing the key and size of each

2293

raw data segment.

2294

:param raw_data: A bytestring containing the data.

2295

:return: A list of memos to retrieve the record later. Each memo is an

2296

opaque index memo. For _KnitKeyAccess the memo is (key, pos,

2297

length), where the key is the record key.

2298

"""

2299

if type(raw_data) != str:

2300

raise AssertionError(

2301

'data must be plain bytes was %s' % type(raw_data))

2302

result = []

2303

offset = 0

2304

# TODO: This can be tuned for writing to sftp and other servers where

2305

# append() is relatively expensive by grouping the writes to each key

2306

# prefix.

2307

for key, size in key_sizes:

2308

path = self._mapper.map(key)

2309

try:

2310

base = self._transport.append_bytes(path + '.knit',

2311

raw_data[offset:offset+size])

2312

except errors.NoSuchFile:

2313

self._transport.mkdir(osutils.dirname(path))

2314

base = self._transport.append_bytes(path + '.knit',

2315

raw_data[offset:offset+size])

2316

# if base == 0:

2317

# chmod.

2318

offset += size

2319

result.append((key, base, size))

2320

return result

2321

2322

def get_raw_records(self, memos_for_retrieval):

2323

"""Get the raw bytes for a records.

2324

2325

:param memos_for_retrieval: An iterable containing the access memo for

2326

retrieving the bytes.

2327

:return: An iterator over the bytes of the records.

2328

"""

2329

# first pass, group into same-index request to minimise readv's issued.

2330

request_lists = []

2331

current_prefix = None

2332

for (key, offset, length) in memos_for_retrieval:

2333

if current_prefix == key[:-1]:

2334

current_list.append((offset, length))

2335

else:

2336

if current_prefix is not None:

2337

request_lists.append((current_prefix, current_list))

2338

current_prefix = key[:-1]

2339

current_list = [(offset, length)]

2340

# handle the last entry

2341

if current_prefix is not None:

2342

request_lists.append((current_prefix, current_list))

2343

for prefix, read_vector in request_lists:

2344

path = self._mapper.map(prefix) + '.knit'

2345

for pos, data in self._transport.readv(path, read_vector):

2346

yield data

2347

2348

2349

class _DirectPackAccess(object):

2350

"""Access to data in one or more packs with less translation."""

2351

2352

def __init__(self, index_to_packs):

2353

"""Create a _DirectPackAccess object.

2354

2355

:param index_to_packs: A dict mapping index objects to the transport

2356

and file names for obtaining data.

2357

"""

2358

self._container_writer = None

2359

self._write_index = None

2360

self._indices = index_to_packs

2361

2362

def add_raw_records(self, key_sizes, raw_data):

2363

"""Add raw knit bytes to a storage area.

2364

2365

The data is spooled to the container writer in one bytes-record per

2366

raw data item.

2367

2368

:param sizes: An iterable of tuples containing the key and size of each

2369

raw data segment.

2370

:param raw_data: A bytestring containing the data.

2371

:return: A list of memos to retrieve the record later. Each memo is an

2372

opaque index memo. For _DirectPackAccess the memo is (index, pos,

2373

length), where the index field is the write_index object supplied

2374

to the PackAccess object.

2375

"""

2376

if type(raw_data) != str:

2377

raise AssertionError(

2378

'data must be plain bytes was %s' % type(raw_data))

2379

result = []

2380

offset = 0

2381

for key, size in key_sizes:

2382

p_offset, p_length = self._container_writer.add_bytes_record(

2383

raw_data[offset:offset+size], [])

2384

offset += size

2385

result.append((self._write_index, p_offset, p_length))

2386

return result

2387

2388

def get_raw_records(self, memos_for_retrieval):

2389

"""Get the raw bytes for a records.

2390

2391

:param memos_for_retrieval: An iterable containing the (index, pos,

2392

length) memo for retrieving the bytes. The Pack access method

2393

looks up the pack to use for a given record in its index_to_pack

2394

map.

2395

:return: An iterator over the bytes of the records.

2396

"""

2397

# first pass, group into same-index requests

2398

request_lists = []

2399

current_index = None

2400

for (index, offset, length) in memos_for_retrieval:

2401

if current_index == index:

2402

current_list.append((offset, length))

2403

else:

2404

if current_index is not None:

2405

request_lists.append((current_index, current_list))

2406

current_index = index

2407

current_list = [(offset, length)]

2408

# handle the last entry

2409

if current_index is not None:

2410

request_lists.append((current_index, current_list))

2411

for index, offsets in request_lists:

2412

transport, path = self._indices[index]

2413

reader = pack.make_readv_reader(transport, path, offsets)

2414

for names, read_func in reader.iter_records():

2415

yield read_func(None)

2416

2417

def set_writer(self, writer, index, transport_packname):

2418

"""Set a writer to use for adding data."""

2419

if index is not None:

2420

self._indices[index] = transport_packname

2421

self._container_writer = writer

2422

self._write_index = index

2423

2424

2425

# Deprecated alias: use patiencediff.PatienceSequenceMatcher instead.

2426

KnitSequenceMatcher = patiencediff.PatienceSequenceMatcher

2427

2428

2429

def annotate_knit(knit, revision_id):
    """Return an iterator over the annotated lines of revision_id in knit.

    The annotations are computed by a freshly created _KnitAnnotator, so this
    is meant for knits that have no cached annotations.  It also works for
    knits with cached annotations, but using it for them is not recommended.
    """
    return iter(_KnitAnnotator(knit).annotate(revision_id))

2438

2439

2440

class _KnitAnnotator(object):

2441

"""Build up the annotations for a text."""

2442

2443

def __init__(self, knit):

2444

self._knit = knit

2445

2446

# Content objects, differs from fulltexts because of how final newlines

2447

# are treated by knits. the content objects here will always have a

2448

# final newline

2449

self._fulltext_contents = {}

2450

2451

# Annotated lines of specific revisions

2452

self._annotated_lines = {}

2453

2454

# Track the raw data for nodes that we could not process yet.

2455

# This maps the revision_id of the base to a list of children that will

2456

# annotated from it.

2457

self._pending_children = {}

2458

2459

# Nodes which cannot be extracted

2460

self._ghosts = set()

2461

2462

# Track how many children this node has, so we know if we need to keep

2463

# it

2464

self._annotate_children = {}

2465

self._compression_children = {}

2466

2467

self._all_build_details = {}

2468

# The children => parent revision_id graph

2469

self._revision_id_graph = {}

2470

2471

self._heads_provider = None

2472

2473

self._nodes_to_keep_annotations = set()

2474

self._generations_until_keep = 100

2475

2476

def set_generations_until_keep(self, value):

2477

"""Set the number of generations before caching a node.

2478

2479

Setting this to -1 will cache every merge node, setting this higher

2480

will cache fewer nodes.

2481

"""

2482

self._generations_until_keep = value

2483

2484

def _add_fulltext_content(self, revision_id, content_obj):

2485

self._fulltext_contents[revision_id] = content_obj

2486

# TODO: jam 20080305 It might be good to check the sha1digest here

2487

return content_obj.text()

2488

2489

def _check_parents(self, child, nodes_to_annotate):

2490

"""Check if all parents have been processed.

2491

2492

:param child: A tuple of (rev_id, parents, raw_content)

2493

:param nodes_to_annotate: If child is ready, add it to

2494

nodes_to_annotate, otherwise put it back in self._pending_children

2495

"""

2496

for parent_id in child[1]:

2497

if (parent_id not in self._annotated_lines):

2498

# This parent is present, but another parent is missing

2499

self._pending_children.setdefault(parent_id,

2500

[]).append(child)

2501

break

2502

else:

2503

# This one is ready to be processed

2504

nodes_to_annotate.append(child)

2505

2506

def _add_annotation(self, revision_id, fulltext, parent_ids,

2507

left_matching_blocks=None):

2508

"""Add an annotation entry.

2509

2510

All parents should already have been annotated.

2511

:return: A list of children that now have their parents satisfied.

2512

"""

2513

a = self._annotated_lines

2514

annotated_parent_lines = [a[p] for p in parent_ids]

2515

annotated_lines = list(annotate.reannotate(annotated_parent_lines,

2516

fulltext, revision_id, left_matching_blocks,

2517

heads_provider=self._get_heads_provider()))

2518

self._annotated_lines[revision_id] = annotated_lines

2519

for p in parent_ids:

2520

ann_children = self._annotate_children[p]

2521

ann_children.remove(revision_id)

2522

if (not ann_children

2523

and p not in self._nodes_to_keep_annotations):

2524

del self._annotated_lines[p]

2525

del self._all_build_details[p]

2526

if p in self._fulltext_contents:

2527

del self._fulltext_contents[p]

2528

# Now that we've added this one, see if there are any pending

2529

# deltas to be done, certainly this parent is finished

2530

nodes_to_annotate = []

2531

for child in self._pending_children.pop(revision_id, []):

2532

self._check_parents(child, nodes_to_annotate)

2533

return nodes_to_annotate

2534

2535

def _get_build_graph(self, key):

2536

"""Get the graphs for building texts and annotations.

2537

2538

The data you need for creating a full text may be different than the

2539

data you need to annotate that text. (At a minimum, you need both

2540

parents to create an annotation, but only need 1 parent to generate the

2541

fulltext.)

2542

2543

:return: A list of (key, index_memo) records, suitable for

2544

passing to read_records_iter to start reading in the raw data fro/

2545

the pack file.

2546

"""

2547

if key in self._annotated_lines:

2548

# Nothing to do

2549

return []

2550

pending = set([key])

2551

records = []

2552

generation = 0

2553

kept_generation = 0

2554

while pending:

2555

# get all pending nodes

2556

generation += 1

2557

this_iteration = pending

2558

build_details = self._knit._index.get_build_details(this_iteration)

2559

self._all_build_details.update(build_details)

2560

# new_nodes = self._knit._index._get_entries(this_iteration)

2561

pending = set()

2562

for key, details in build_details.iteritems():

2563

(index_memo, compression_parent, parents,

2564

record_details) = details

2565

self._revision_id_graph[key] = parents

2566

records.append((key, index_memo))

2567

# Do we actually need to check _annotated_lines?

2568

pending.update(p for p in parents

2569

if p not in self._all_build_details)

2570

if compression_parent:

2571

self._compression_children.setdefault(compression_parent,

2572

[]).append(key)

2573

if parents:

2574

for parent in parents:

2575

self._annotate_children.setdefault(parent,

2576

[]).append(key)

2577

num_gens = generation - kept_generation

2578

if ((num_gens >= self._generations_until_keep)

2579

and len(parents) > 1):

2580

kept_generation = generation

2581

self._nodes_to_keep_annotations.add(key)

2582

2583

missing_versions = this_iteration.difference(build_details.keys())

2584

self._ghosts.update(missing_versions)

2585

for missing_version in missing_versions:

2586

# add a key, no parents

2587

self._revision_id_graph[missing_version] = ()

2588

pending.discard(missing_version) # don't look for it

2589

if self._ghosts.intersection(self._compression_children):

2590

raise KnitCorrupt(

2591

"We cannot have nodes which have a ghost compression parent:\n"

2592

"ghosts: %r\n"

2593

"compression children: %r"

2594

% (self._ghosts, self._compression_children))

2595

# Cleanout anything that depends on a ghost so that we don't wait for

2596

# the ghost to show up

2597

for node in self._ghosts:

2598

if node in self._annotate_children:

2599

# We won't be building this node

2600

del self._annotate_children[node]

2601

# Generally we will want to read the records in reverse order, because

2602

# we find the parent nodes after the children

2603

records.reverse()

2604

return records

2605

2606

def _annotate_records(self, records):

2607

"""Build the annotations for the listed records."""

2608

# We iterate in the order read, rather than a strict order requested

2609

# However, process what we can, and put off to the side things that

2610

# still need parents, cleaning them up when those parents are

2611

# processed.

2612

for (rev_id, record,

2613

digest) in self._knit._read_records_iter(records):

2614

if rev_id in self._annotated_lines:

2615

continue

2616

parent_ids = self._revision_id_graph[rev_id]

2617

parent_ids = [p for p in parent_ids if p not in self._ghosts]

2618

details = self._all_build_details[rev_id]

2619

(index_memo, compression_parent, parents,

2620

record_details) = details

2621

nodes_to_annotate = []

2622

# TODO: Remove the punning between compression parents, and

2623

# parent_ids, we should be able to do this without assuming

2624

# the build order

2625

if len(parent_ids) == 0:

2626

# There are no parents for this node, so just add it

2627

# TODO: This probably needs to be decoupled

2628

fulltext_content, delta = self._knit._factory.parse_record(

2629

rev_id, record, record_details, None)

2630

fulltext = self._add_fulltext_content(rev_id, fulltext_content)

2631

nodes_to_annotate.extend(self._add_annotation(rev_id, fulltext,

2632

parent_ids, left_matching_blocks=None))

2633

else:

2634

child = (rev_id, parent_ids, record)

2635

# Check if all the parents are present

2636

self._check_parents(child, nodes_to_annotate)

2637

while nodes_to_annotate:

2638

# Should we use a queue here instead of a stack?

2639

(rev_id, parent_ids, record) = nodes_to_annotate.pop()

2640

(index_memo, compression_parent, parents,

2641

record_details) = self._all_build_details[rev_id]

2642

if compression_parent is not None:

2643

comp_children = self._compression_children[compression_parent]

2644

if rev_id not in comp_children:

2645

raise AssertionError("%r not in compression children %r"

2646

% (rev_id, comp_children))

2647

# If there is only 1 child, it is safe to reuse this

2648

# content

2649

reuse_content = (len(comp_children) == 1

2650

and compression_parent not in

2651

self._nodes_to_keep_annotations)

2652

if reuse_content:

2653

# Remove it from the cache since it will be changing

2654

parent_fulltext_content = self._fulltext_contents.pop(compression_parent)

2655

# Make sure to copy the fulltext since it might be

2656

# modified

2657

parent_fulltext = list(parent_fulltext_content.text())

2658

else:

2659

parent_fulltext_content = self._fulltext_contents[compression_parent]

2660

parent_fulltext = parent_fulltext_content.text()

2661

comp_children.remove(rev_id)

2662

fulltext_content, delta = self._knit._factory.parse_record(

2663

rev_id, record, record_details,

2664

parent_fulltext_content,

2665

copy_base_content=(not reuse_content))

2666

fulltext = self._add_fulltext_content(rev_id,

2667

fulltext_content)

2668

blocks = KnitContent.get_line_delta_blocks(delta,

2669

parent_fulltext, fulltext)

2670

else:

2671

fulltext_content = self._knit._factory.parse_fulltext(

2672

record, rev_id)

2673

fulltext = self._add_fulltext_content(rev_id,

2674

fulltext_content)

2675

blocks = None

2676

nodes_to_annotate.extend(

2677

self._add_annotation(rev_id, fulltext, parent_ids,

2678

left_matching_blocks=blocks))

2679

2680

def _get_heads_provider(self):

2681

"""Create a heads provider for resolving ancestry issues."""

2682

if self._heads_provider is not None:

2683

return self._heads_provider

2684

parent_provider = _mod_graph.DictParentsProvider(

2685

self._revision_id_graph)

2686

graph_obj = _mod_graph.Graph(parent_provider)

2687

head_cache = _mod_graph.FrozenHeadsCache(graph_obj)

2688

self._heads_provider = head_cache

2689

return head_cache

2690

2691

def annotate(self, key):

2692

"""Return the annotated fulltext at the given key.

2693

2694

:param key: The key to annotate.

2695

"""

2696

if True or len(self._knit._fallback_vfs) > 0:

2697

# stacked knits can't use the fast path at present.

2698

return self._simple_annotate(key)

2699

records = self._get_build_graph(key)

2700

if key in self._ghosts:

2701

raise errors.RevisionNotPresent(key, self._knit)

2702

self._annotate_records(records)

2703

return self._annotated_lines[key]

2704

2705

def _simple_annotate(self, key):

2706

"""Return annotated fulltext, rediffing from the full texts.

2707

2708

This is slow but makes no assumptions about the repository

2709

being able to produce line deltas.

2710

"""

2711

# TODO: this code generates a parent maps of present ancestors; it

2712

# could be split out into a separate method, and probably should use

2713

# iter_ancestry instead. -- mbp and robertc 20080704

2714

graph = _mod_graph.Graph(self._knit)

2715

head_cache = _mod_graph.FrozenHeadsCache(graph)

2716

search = graph._make_breadth_first_searcher([key])

2717

keys = set()

2718

while True:

2719

try:

2720

present, ghosts = search.next_with_ghosts()

2721

except StopIteration:

2722

break

2723

keys.update(present)

2724

parent_map = self._knit.get_parent_map(keys)

2725

parent_cache = {}

2726

reannotate = annotate.reannotate

2727

for record in self._knit.get_record_stream(keys, 'topological', True):

2728

key = record.key

2729

fulltext = split_lines(record.get_bytes_as('fulltext'))

2730

parents = parent_map[key]

2731

if parents is not None:

2732

parent_lines = [parent_cache[parent] for parent in parent_map[key]]

2733

else:

2734

parent_lines = []

2735

parent_cache[key] = list(

2736

reannotate(parent_lines, fulltext, key, None, head_cache))

2737

try:

2738

return parent_cache[key]

2739

except KeyError, e:

2740

raise errors.RevisionNotPresent(key, self._knit)

2741

2742

2743

try:

2744

from bzrlib._knit_load_data_c import _load_data_c as _load_data

2745

except ImportError:

2746

from bzrlib._knit_load_data_py import _load_data_py as _load_data

Older »