/brz/remove-bazaar : revision 3350.6.4

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/repofmt/pack_repo.py

Committer: Robert Collins
Date: 2008-06-11 04:20:16 UTC
mto: (3221.12.10 Development1) (3517.4.1 annotate)
mto: This revision was merged to the branch mainline in revision 3510.
Revision ID: robertc@robertcollins.net-20080611042016-661dds0v1rjz542g

First cut at pluralised VersionedFiles. Some rather massive API incompatibilities, primarily because of the difficulty of coherence among competing stores.

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/helpers.py

bzrlib/tests/repository_implementations/test__generate_text_key_index.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_find_text_key_references.py

bzrlib/tests/repository_implementations/test_has_revisions.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_is_write_locked.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bzr_access

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/revnos.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/index.txt

generate_docs.py

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/package_mf.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

tools/win32/survey.txt

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/repofmt/pack_repo.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from itertools import izip

import math

import md5

import time

from bzrlib import (

debug,

graph,

pack,

ui,

)

from bzrlib.index import (

GraphIndex,

GraphIndexBuilder,

InMemoryGraphIndex,

CombinedGraphIndex,

GraphIndexPrefixAdapter,

)

from bzrlib.knit import (

KnitPlainFactory,

KnitVersionedFiles,

_KnitGraphIndex,

_DirectPackAccess,

)

from bzrlib.osutils import rand_chars, split_lines

from bzrlib.pack import ContainerWriter

from bzrlib.store import revision

from bzrlib import tsort

""")

from bzrlib import (

bzrdir,

errors,

lockable_files,

lockdir,

osutils,

symbol_versioning,

transactions,

xml5,

xml6,

xml7,

)

from bzrlib.decorators import needs_read_lock, needs_write_lock

from bzrlib.repofmt.knitrepo import KnitRepository

from bzrlib.repository import (

CommitBuilder,

MetaDirRepository,

MetaDirRepositoryFormat,

RepositoryFormat,

RootCommitBuilder,

)

import bzrlib.revision as _mod_revision

from bzrlib.store.versioned import VersionedFileStore

from bzrlib.trace import (

mutter,

mutter_callsite,

note,

warning,

)

class PackCommitBuilder(CommitBuilder):
    """CommitBuilder variant that adds texts with pack semantics.

    Instead of one knit object per added text, a single knit object is
    used, which reduces memory and object pressure.
    """

    def __init__(self, repository, parents, config, timestamp=None,
                 timezone=None, committer=None, revprops=None,
                 revision_id=None):
        """Set up the builder and a graph over the repository's text index.

        Every argument is forwarded unchanged to CommitBuilder.__init__.
        In addition, repository must provide
        ``_pack_collection.text_index.combined_index``, which is wrapped in
        a graph.Graph and stored as ``self._file_graph``.
        """
        CommitBuilder.__init__(
            self, repository, parents, config,
            timestamp=timestamp, timezone=timezone, committer=committer,
            revprops=revprops, revision_id=revision_id)
        text_index = repository._pack_collection.text_index
        self._file_graph = graph.Graph(text_index.combined_index)

    def _heads(self, file_id, revision_ids):
        """Return the set of revision ids that are heads for file_id.

        Each revision id is paired with file_id to form a
        (file_id, revision_id) key, the keys are passed to the file
        graph's heads(), and the revision-id part of every returned key
        is collected into a set.
        """
        text_keys = [(file_id, rev_id) for rev_id in revision_ids]
        head_keys = self._file_graph.heads(text_keys)
        return set(head_key[1] for head_key in head_keys)

100

101

class PackRootCommitBuilder(RootCommitBuilder):
    """A subclass of RootCommitBuilder to add texts with pack semantics.

    Specifically this uses one knit object rather than one knit object per
    added text, reducing memory and object pressure.
    """

    def __init__(self, repository, parents, config, timestamp=None,
                 timezone=None, committer=None, revprops=None,
                 revision_id=None):
        # Chain to the immediate base class rather than reaching past it to
        # CommitBuilder, so any initialisation RootCommitBuilder performs is
        # not skipped.
        RootCommitBuilder.__init__(self, repository, parents, config,
            timestamp=timestamp, timezone=timezone, committer=committer,
            revprops=revprops, revision_id=revision_id)
        # Graph over the combined text index of the repository's pack
        # collection; _heads() queries it with (file_id, revision_id) keys.
        self._file_graph = graph.Graph(
            repository._pack_collection.text_index.combined_index)

    def _heads(self, file_id, revision_ids):
        """Return the set of revision ids that are heads for file_id."""
        keys = [(file_id, revision_id) for revision_id in revision_ids]
        return set([key[1] for key in self._file_graph.heads(keys)])

120

121

122

class Pack(object):
    """An in memory proxy for a pack and its indices.

    This is a base class that is not directly used, instead the classes
    ExistingPack and NewPack are used.

    Several methods read ``self.name`` and ``self.pack_transport``, which
    this class never assigns; the subclasses are expected to provide them.
    """

    def __init__(self, revision_index, inventory_index, text_index,
                 signature_index):
        """Create a pack instance.

        :param revision_index: A GraphIndex for determining what revisions are
            present in the Pack and accessing the locations of their texts.
        :param inventory_index: A GraphIndex for determining what inventories are
            present in the Pack and accessing the locations of their
            texts/deltas.
        :param text_index: A GraphIndex for determining what file texts
            are present in the pack and accessing the locations of their
            texts/deltas (via (fileid, revisionid) tuples).
        :param signature_index: A GraphIndex for determining what signatures are
            present in the Pack and accessing the locations of their texts.
        """
        self.revision_index = revision_index
        self.inventory_index = inventory_index
        self.text_index = text_index
        self.signature_index = signature_index

    def access_tuple(self):
        """Return a tuple (transport, name) for the pack content."""
        return self.pack_transport, self.file_name()

    def file_name(self):
        """Get the file name for the pack on disk."""
        return self.name + '.pack'

    def get_revision_count(self):
        """Return the number of keys in the revision index."""
        return self.revision_index.key_count()

    # The four *_index_name helpers delegate to self.index_name(), which is
    # not defined on this base class.
    # NOTE(review): within this file only NewPack defines index_name -
    # confirm before calling these on other Pack subclasses.

    def inventory_index_name(self, name):
        """The inv index is the name + .iix."""
        return self.index_name('inventory', name)

    def revision_index_name(self, name):
        """The revision index is the name + .rix."""
        return self.index_name('revision', name)

    def signature_index_name(self, name):
        """The signature index is the name + .six."""
        return self.index_name('signature', name)

    def text_index_name(self, name):
        """The text index is the name + .tix."""
        return self.index_name('text', name)

    def _external_compression_parents_of_texts(self):
        """Return text references that are not keys of this pack.

        Walks every node of the text index, collecting each node's key and
        the contents of its second reference list.

        :return: The set of referenced keys that have no entry in this
            pack's text index.
        """
        keys = set()
        refs = set()
        for node in self.text_index.iter_all_entries():
            # node[1] is the key; node[3][1] is the second reference list.
            keys.add(node[1])
            refs.update(node[3][1])
        return refs - keys

183

184

185

class ExistingPack(Pack):
    """An in memory proxy for an existing .pack and its disk indices."""

    def __init__(self, pack_transport, name, revision_index, inventory_index,
                 text_index, signature_index):
        """Create an ExistingPack object.

        :param pack_transport: The transport where the pack file resides.
        :param name: The name of the pack on disk in the pack_transport.
        :param revision_index: Index handed through to Pack.__init__.
        :param inventory_index: Index handed through to Pack.__init__.
        :param text_index: Index handed through to Pack.__init__.
        :param signature_index: Index handed through to Pack.__init__.
        :raises AssertionError: If any of the arguments is None.
        """
        Pack.__init__(self, revision_index, inventory_index, text_index,
                      signature_index)
        self.name = name
        self.pack_transport = pack_transport
        if None in (revision_index, inventory_index, text_index,
                    signature_index, name, pack_transport):
            raise AssertionError()

    def __eq__(self, other):
        """Two packs are equal when all their instance attributes match."""
        return self.__dict__ == other.__dict__

    def __ne__(self, other):
        return not self.__eq__(other)

    def __repr__(self):
        # The attribute holding the transport is pack_transport; there is no
        # 'transport' attribute on this object, so referring to it raised
        # AttributeError whenever a pack was repr()'d.
        return "<bzrlib.repofmt.pack_repo.Pack object at 0x%x, %s, %s>" % (
            id(self), self.pack_transport, self.name)

212

213

214

class NewPack(Pack):
    """An in memory proxy for a pack which is being created."""

    # A map of index 'type' to the file extension and position in the
    # index_sizes array.
    index_definitions = {
        'revision': ('.rix', 0),
        'inventory': ('.iix', 1),
        'text': ('.tix', 2),
        'signature': ('.six', 3),
        }

    def __init__(self, upload_transport, index_transport, pack_transport,
                 upload_suffix='', file_mode=None):
        """Create a NewPack instance.

        Opens a write stream for a randomly named temporary file on
        upload_transport and starts a pack container on it.

        :param upload_transport: A writable transport for the pack to be
            incrementally uploaded to.
        :param index_transport: A writable transport for the pack's indices to
            be written to when the pack is finished.
        :param pack_transport: A writable transport for the pack to be renamed
            to when the upload is complete. This *must* be the same as
            upload_transport.clone('../packs').
        :param upload_suffix: An optional suffix to be given to any temporary
            files created during the pack creation. e.g '.autopack'
        :param file_mode: An optional file mode to create the new files with.
        """
        # The relative locations of the packs are constrained, but all are
        # passed in because the caller has them, so as to avoid object churn.
        Pack.__init__(self,
            # Revisions: parents list, no text compression.
            InMemoryGraphIndex(reference_lists=1),
            # Inventory: We want to map compression only, but currently the
            # knit code hasn't been updated enough to understand that, so we
            # have a regular 2-list index giving parents and compression
            # source.
            InMemoryGraphIndex(reference_lists=2),
            # Texts: compression and per file graph, for all fileids - so two
            # reference lists and two elements in the key tuple.
            InMemoryGraphIndex(reference_lists=2, key_elements=2),
            # Signatures: Just blobs to store, no compression, no parents
            # listing.
            InMemoryGraphIndex(reference_lists=0),
            )
        # where should the new pack be opened
        self.upload_transport = upload_transport
        # where are indices written out to
        self.index_transport = index_transport
        # where is the pack renamed to when it is finished?
        self.pack_transport = pack_transport
        # What file mode to upload the pack and indices with.
        self._file_mode = file_mode
        # tracks the content written to the .pack file.
        self._hash = md5.new()
        # a four-tuple with the length in bytes of the indices, once the pack
        # is finalised. (rev, inv, text, sigs)
        self.index_sizes = None
        # How much data to cache when writing packs. Note that this is not
        # synchronised with reads, because it's not in the transport layer, so
        # is not safe unless the client knows it won't be reading from the pack
        # under creation.
        self._cache_limit = 0
        # the temporary pack file name.
        self.random_name = rand_chars(20) + upload_suffix
        # when was this pack started ?
        self.start_time = time.time()
        # open an output stream for the data added to the pack.
        self.write_stream = self.upload_transport.open_write_stream(
            self.random_name, mode=self._file_mode)
        if 'pack' in debug.debug_flags:
            mutter('%s: create_pack: pack stream open: %s%s t+%6.3fs',
                time.ctime(), self.upload_transport.base, self.random_name,
                time.time() - self.start_time)
        # A list of byte sequences to be written to the new pack, and the
        # aggregate size of them.  Stored as a list rather than separate
        # variables so that the _write_data closure below can update them.
        self._buffer = [[], 0]
        # create a callable for adding data
        #
        # robertc says- this is a closure rather than a method on the object
        # so that the variables are locals, and faster than accessing object
        # members.
        def _write_data(bytes, flush=False, _buffer=self._buffer,
            _write=self.write_stream.write, _update=self._hash.update):
            _buffer[0].append(bytes)
            _buffer[1] += len(bytes)
            # buffer cap
            if _buffer[1] > self._cache_limit or flush:
                bytes = ''.join(_buffer[0])
                _write(bytes)
                _update(bytes)
                # Reset in place: the closure and self._buffer share this
                # list object, so it must not be rebound.
                _buffer[:] = [[], 0]
        # expose this on self, for the occasion when clients want to add data.
        self._write_data = _write_data
        # a pack writer object to serialise pack records.
        self._writer = pack.ContainerWriter(self._write_data)
        self._writer.begin()
        # what state is the pack in? (open, finished, aborted)
        self._state = 'open'

    def abort(self):
        """Cancel creating this pack."""
        self._state = 'aborted'
        self.write_stream.close()
        # Remove the temporary pack file.
        self.upload_transport.delete(self.random_name)
        # The indices have no state on disk.

    def access_tuple(self):
        """Return a tuple (transport, name) for the pack content.

        :raises AssertionError: If the pack is neither 'finished' nor 'open'
            (for example after abort()).
        """
        if self._state == 'finished':
            return Pack.access_tuple(self)
        elif self._state == 'open':
            return self.upload_transport, self.random_name
        else:
            raise AssertionError(self._state)

    def data_inserted(self):
        """True if data has been added to this pack."""
        return bool(self.get_revision_count() or
            self.inventory_index.key_count() or
            self.text_index.key_count() or
            self.signature_index.key_count())

    def finish(self):
        """Finish the new pack.

        This:
         - finalises the content
         - assigns a name (the md5 of the content, currently)
         - writes out the associated indices
         - renames the pack into place.
         - stores the index size tuple for the pack in the index_sizes
           attribute.
        """
        self._writer.end()
        if self._buffer[1]:
            self._write_data('', flush=True)
        self.name = self._hash.hexdigest()
        # write indices
        # XXX: It'd be better to write them all to temporary names, then
        # rename them all into place, so that the window when only some are
        # visible is smaller.  On the other hand none will be seen until
        # they're in the names list.
        self.index_sizes = [None, None, None, None]
        self._write_index('revision', self.revision_index, 'revision')
        self._write_index('inventory', self.inventory_index, 'inventory')
        self._write_index('text', self.text_index, 'file texts')
        self._write_index('signature', self.signature_index,
            'revision signatures')
        self.write_stream.close()
        # Note that this will clobber an existing pack with the same name,
        # without checking for hash collisions. While this is undesirable this
        # is something that can be rectified in a subsequent release. One way
        # to rectify it may be to leave the pack at the original name, writing
        # its pack-names entry as something like 'HASH: index-sizes
        # temporary-name'. Allocate that and check for collisions, if it is
        # collision free then rename it into place. If clients know this scheme
        # they can handle missing-file errors by:
        #  - try for HASH.pack
        #  - try for temporary-name
        #  - refresh the pack-list to see if the pack is now absent
        self.upload_transport.rename(self.random_name,
                '../packs/' + self.name + '.pack')
        self._state = 'finished'
        if 'pack' in debug.debug_flags:
            # XXX: size might be interesting?
            # Log the destination transport's base URL (as done for the
            # upload transport) rather than the transport object itself.
            mutter('%s: create_pack: pack renamed into place: %s%s->%s%s t+%6.3fs',
                time.ctime(), self.upload_transport.base, self.random_name,
                self.pack_transport.base, self.name,
                time.time() - self.start_time)

    def flush(self):
        """Flush any current data."""
        if self._buffer[1]:
            bytes = ''.join(self._buffer[0])
            self.write_stream.write(bytes)
            self._hash.update(bytes)
            # In-place reset; see the note in _write_data.
            self._buffer[:] = [[], 0]

    def index_name(self, index_type, name):
        """Get the disk name of an index type for pack name 'name'."""
        return name + NewPack.index_definitions[index_type][0]

    def index_offset(self, index_type):
        """Get the position in a index_size array for a given index type."""
        return NewPack.index_definitions[index_type][1]

    def _replace_index_with_readonly(self, index_type):
        """Swap the in-memory index of index_type for a GraphIndex.

        The GraphIndex is built from the index transport, the on-disk index
        name and the size recorded in index_sizes, so the index must already
        have been written out.
        """
        setattr(self, index_type + '_index',
            GraphIndex(self.index_transport,
                self.index_name(index_type, self.name),
                self.index_sizes[self.index_offset(index_type)]))

    def set_write_cache_size(self, size):
        """Set how many bytes _write_data may buffer before writing."""
        self._cache_limit = size

    def _write_index(self, index_type, index, label):
        """Write out an index.

        :param index_type: The type of index to write - e.g. 'revision'.
        :param index: The index object to serialise.
        :param label: What label to give the index e.g. 'revision'.
        """
        index_name = self.index_name(index_type, self.name)
        # put_file's return value is recorded as the size of this index.
        self.index_sizes[self.index_offset(index_type)] = \
            self.index_transport.put_file(index_name, index.finish(),
            mode=self._file_mode)
        if 'pack' in debug.debug_flags:
            # XXX: size might be interesting?
            mutter('%s: create_pack: wrote %s index: %s%s t+%6.3fs',
                time.ctime(), label, self.upload_transport.base,
                self.random_name, time.time() - self.start_time)
        # Replace the writable index on this object with a readonly,
        # presently unloaded index. We should alter
        # the index layer to make its finish() error if add_node is
        # subsequently used. RBC
        self._replace_index_with_readonly(index_type)

432

433

434

class AggregateIndex(object):
    """An aggregated index for the RepositoryPackCollection.

    AggregateIndex is responsible for managing the PackAccess object,
    Index-To-Pack mapping, and all indices list for a specific type of index
    such as 'revision index'.

    A CombinedIndex provides an index on a single key space built up
    from several on-disk indices.  The AggregateIndex builds on this
    to provide a knit access layer, and allows having up to one writable
    index within the collection.
    """
    # XXX: Probably 'can be written to' could/should be separated from 'acts
    # like a knit index' -- mbp 20071024

    def __init__(self):
        """Create an AggregateIndex."""
        mapping = {}
        self.index_to_pack = mapping
        self.combined_index = CombinedGraphIndex([])
        # data_access is handed the very same dict object, so later in-place
        # updates of index_to_pack are visible to it.
        self.data_access = _DirectPackAccess(mapping)
        self.add_callback = None

    def replace_indices(self, index_to_pack, indices):
        """Replace the current mappings with fresh ones.

        This should probably not be used eventually, rather incremental add and
        removal of indices. It has been added during refactoring of existing
        code.

        :param index_to_pack: A mapping from index objects to
            (transport, name) tuples for the pack file data.
        :param indices: A list of indices.
        """
        # Mutate the existing dict rather than rebinding the attribute, so
        # the instance itself is kept.
        current_map = self.index_to_pack
        current_map.clear()
        current_map.update(index_to_pack)
        # XXX: API break - clearly a 'replace' method would be good?
        self.combined_index._indices[:] = indices
        # No index is writable after a wholesale replacement.
        self.add_callback = None

    def add_index(self, index, pack):
        """Add index to the aggregate, which is an index for Pack pack.

        Future searches on the aggregate index will search this new index
        before all previously inserted indices.

        :param index: An Index for the pack.
        :param pack: A Pack instance.
        """
        access = pack.access_tuple()
        # Record where the data for this index lives ...
        self.index_to_pack[index] = access
        # ... and make it the first index consulted.
        self.combined_index.insert_index(0, index)

    def add_writable_index(self, index, pack):
        """Add an index which is able to have data added to it.

        There can be at most one writable index at any time.  Any
        modifications made to the knit are put into this index.

        :param index: An index from the pack parameter.
        :param pack: A Pack instance.
        """
        already_writable = self.add_callback is not None
        if already_writable:
            raise AssertionError(
                "%s already has a writable index through %s" % \
                (self, self.add_callback))
        # Register the index like any other one first.
        self.add_index(index, pack)
        # Route writes to the pack's writer; this updates the index to
        # packs mapping as a side effect.
        self.data_access.set_writer(pack._writer, index, pack.access_tuple())
        self.add_callback = index.add_nodes

    def clear(self):
        """Reset all the aggregate data to nothing."""
        self.data_access.set_writer(None, None, (None, None))
        self.index_to_pack.clear()
        self.combined_index._indices[:] = []
        self.add_callback = None

    def remove_index(self, index, pack):
        """Remove index from the indices used to answer queries.

        :param index: An index from the pack parameter.
        :param pack: A Pack instance.
        """
        del self.index_to_pack[index]
        self.combined_index._indices.remove(index)
        if self.add_callback is None:
            return
        # If the index being removed was the writable one, stop accepting
        # writes through it.
        if getattr(index, 'add_nodes', None) == self.add_callback:
            self.add_callback = None
            self.data_access.set_writer(None, None, (None, None))

528

529

530

class Packer(object):

531

"""Create a pack from packs."""

532

533

def __init__(self, pack_collection, packs, suffix, revision_ids=None):

534

"""Create a Packer.

535

536

:param pack_collection: A RepositoryPackCollection object where the

537

new pack is being written to.

538

:param packs: The packs to combine.

539

:param suffix: The suffix to use on the temporary files for the pack.

540

:param revision_ids: Revision ids to limit the pack to.

541

"""

542

self.packs = packs

543

self.suffix = suffix

544

self.revision_ids = revision_ids

545

# The pack object we are creating.

546

self.new_pack = None

547

self._pack_collection = pack_collection

548

# The index layer keys for the revisions being copied. None for 'all

549

# objects'.

550

self._revision_keys = None

551

# What text keys to copy. None for 'all texts'. This is set by

552

# _copy_inventory_texts

553

self._text_filter = None

554

self._extra_init()

555

556

def _extra_init(self):

557

"""A template hook to allow extending the constructor trivially."""

558

559

def pack(self, pb=None):

560

"""Create a new pack by reading data from other packs.

561

562

This does little more than a bulk copy of data. One key difference

563

is that data with the same item key across multiple packs is elided

564

from the output. The new pack is written into the current pack store

565

along with its indices, and the name added to the pack names. The

566

source packs are not altered and are not required to be in the current

567

pack collection.

568

569

:param pb: An optional progress bar to use. A nested bar is created if

570

this is None.

571

:return: A Pack object, or None if nothing was copied.

572

"""

573

# open a pack - using the same name as the last temporary file

574

# - which has already been flushed, so its safe.

575

# XXX: - duplicate code warning with start_write_group; fix before

576

# considering 'done'.

577

if self._pack_collection._new_pack is not None:

578

raise errors.BzrError('call to create_pack_from_packs while '

579

'another pack is being written.')

580

if self.revision_ids is not None:

581

if len(self.revision_ids) == 0:

582

# silly fetch request.

583

return None

584

else:

585

self.revision_ids = frozenset(self.revision_ids)

586

self.revision_keys = frozenset((revid,) for revid in

587

self.revision_ids)

588

if pb is None:

589

self.pb = ui.ui_factory.nested_progress_bar()

590

else:

591

self.pb = pb

592

try:

593

return self._create_pack_from_packs()

594

finally:

595

if pb is None:

596

self.pb.finished()

597

598

def open_pack(self):
    """Open a pack for the pack we are creating."""
    collection = self._pack_collection
    # The new files are created with the repository control files' mode.
    mode = collection.repo.control_files._file_mode
    return NewPack(
        collection._upload_transport,
        collection._index_transport,
        collection._pack_transport,
        upload_suffix=self.suffix,
        file_mode=mode)

604

605

def _copy_revision_texts(self):
    """Copy revision data to the new pack."""
    collection = self._pack_collection
    # Build the key filter: one 1-tuple per wanted revision, or None when
    # no revision ids were given.
    revision_keys = None
    if self.revision_ids:
        revision_keys = [(revision_id,) for revision_id in self.revision_ids]
    # Look up the matching nodes in the source packs' revision indices.
    index_map = collection._packs_list_to_pack_map_and_index_list(
        self.packs, 'revision_index')[0]
    nodes = collection._index_contents(index_map, revision_keys)
    # copy revision keys and adjust values
    self.pb.update("Copying revision texts", 1)
    total_items, readv_group_iter = self._revision_node_readv(nodes)
    copier = self._copy_nodes_graph(index_map, self.new_pack._writer,
        self.new_pack.revision_index, readv_group_iter, total_items)
    # The copier is a generator: exhaust it so the copy actually runs.
    list(copier)
    if 'pack' in debug.debug_flags:
        mutter('%s: create_pack: revisions copied: %s%s %d items t+%6.3fs',
            time.ctime(), collection._upload_transport.base,
            self.new_pack.random_name,
            self.new_pack.revision_index.key_count(),
            time.time() - self.new_pack.start_time)
    # Remembered for the inventory and signature copying steps.
    self._revision_keys = revision_keys

628

629

def _copy_inventory_texts(self):
    """Copy the inventory texts to the new pack.

    self._revision_keys is used to determine what inventories to copy.

    Sets self._text_filter appropriately.
    """
    collection = self._pack_collection
    # Inventory keys currently share the revision keyspace. Note that
    # querying for keys here could introduce a bug where an inventory item
    # is missed, so do not change it to query separately without cross
    # checking like the text key check done when copying texts.
    wanted_keys = self._revision_keys
    index_map = collection._packs_list_to_pack_map_and_index_list(
        self.packs, 'inventory_index')[0]
    nodes = collection._index_contents(index_map, wanted_keys)
    # copy inventory keys and adjust values
    # XXX: Should be a helper function to allow different inv representation
    # at this point.
    self.pb.update("Copying inventory texts", 2)
    total_items, readv_group_iter = self._least_readv_node_readv(nodes)
    # Only grab the output lines if we will be processing them
    want_lines = bool(self.revision_ids)
    inv_lines = self._copy_nodes_graph(index_map,
        self.new_pack._writer, self.new_pack.inventory_index,
        readv_group_iter, total_items, output_lines=want_lines)
    if want_lines:
        self._process_inventory_lines(inv_lines)
    else:
        # eat the iterator to cause it to execute.
        list(inv_lines)
        self._text_filter = None
    if 'pack' in debug.debug_flags:
        mutter('%s: create_pack: inventories copied: %s%s %d items t+%6.3fs',
            time.ctime(), collection._upload_transport.base,
            self.new_pack.random_name,
            self.new_pack.inventory_index.key_count(),
            time.time() - self.new_pack.start_time)

666

667

def _copy_text_texts(self):

668

# select text keys

669

text_index_map, text_nodes = self._get_text_nodes()

670

if self._text_filter is not None:

671

# We could return the keys copied as part of the return value from

672

# _copy_nodes_graph but this doesn't work all that well with the

673

# need to get line output too, so we check separately, and as we're

674

# going to buffer everything anyway, we check beforehand, which

675

# saves reading knit data over the wire when we know there are

676

# mising records.

677

text_nodes = set(text_nodes)

678

present_text_keys = set(_node[1] for _node in text_nodes)

679

missing_text_keys = set(self._text_filter) - present_text_keys

680

if missing_text_keys:

681

# TODO: raise a specific error that can handle many missing

682

# keys.

683

a_missing_key = missing_text_keys.pop()

684

raise errors.RevisionNotPresent(a_missing_key[1],

685

a_missing_key[0])

686

# copy text keys and adjust values

687

self.pb.update("Copying content texts", 3)

688

total_items, readv_group_iter = self._least_readv_node_readv(text_nodes)

689

list(self._copy_nodes_graph(text_index_map, self.new_pack._writer,

690

self.new_pack.text_index, readv_group_iter, total_items))

691

self._log_copied_texts()

692

693

def _check_references(self):

694

"""Make sure our external refereneces are present."""

695

external_refs = self.new_pack._external_compression_parents_of_texts()

696

if external_refs:

697

index = self._pack_collection.text_index.combined_index

698

found_items = list(index.iter_entries(external_refs))

699

if len(found_items) != len(external_refs):

700

found_keys = set(k for idx, k, refs, value in found_items)

701

missing_items = external_refs - found_keys

702

missing_file_id, missing_revision_id = missing_items.pop()

703

raise errors.RevisionNotPresent(missing_revision_id,

704

missing_file_id)

705

706

def _create_pack_from_packs(self):
    """Do the work of pack(): copy everything into one new pack.

    Revisions, inventories, file texts and signatures are copied in that
    order, then references are checked and the pack is finished.

    :return: The finished new pack, or None when self._use_pack() rejects
        it (in which case the new pack is aborted).
    """
    collection = self._pack_collection
    debugging = 'pack' in debug.debug_flags
    self.pb.update("Opening pack", 0, 5)
    new_pack = self.open_pack()
    self.new_pack = new_pack
    # buffer data - we won't be reading-back during the pack creation and
    # this makes a significant difference on sftp pushes.
    new_pack.set_write_cache_size(1024*1024)
    if debugging:
        plain_pack_list = []
        for a_pack in self.packs:
            plain_pack_list.append(
                '%s%s' % (a_pack.pack_transport.base, a_pack.name))
        rev_count = 'all'
        if self.revision_ids is not None:
            rev_count = len(self.revision_ids)
        mutter('%s: create_pack: creating pack from source packs: '
            '%s%s %s revisions wanted %s t=0',
            time.ctime(), collection._upload_transport.base,
            new_pack.random_name, plain_pack_list, rev_count)
    self._copy_revision_texts()
    self._copy_inventory_texts()
    self._copy_text_texts()
    # select signature keys; they share the revision keyspace.
    signature_filter = self._revision_keys
    signature_index_map = \
        collection._packs_list_to_pack_map_and_index_list(
            self.packs, 'signature_index')[0]
    signature_nodes = collection._index_contents(signature_index_map,
        signature_filter)
    # copy signature keys and adjust values
    self.pb.update("Copying signature texts", 4)
    self._copy_nodes(signature_nodes, signature_index_map,
        new_pack._writer, new_pack.signature_index)
    if debugging:
        mutter('%s: create_pack: revision signatures copied: %s%s %d items t+%6.3fs',
            time.ctime(), collection._upload_transport.base,
            new_pack.random_name,
            new_pack.signature_index.key_count(),
            time.time() - new_pack.start_time)
    self._check_references()
    if self._use_pack(new_pack):
        self.pb.update("Finishing pack", 5)
        new_pack.finish()
        collection.allocate(new_pack)
        return new_pack
    # Not worth keeping: discard the temporary pack.
    new_pack.abort()
    return None

750

751

def _copy_nodes(self, nodes, index_map, writer, write_index):
    """Copy knit nodes between packs with no graph references."""
    progress = ui.ui_factory.nested_progress_bar()
    try:
        outcome = self._do_copy_nodes(nodes, index_map, writer,
            write_index, progress)
    finally:
        # Always release the nested progress bar, even on error.
        progress.finished()
    return outcome

759

760

def _do_copy_nodes(self, nodes, index_map, writer, write_index, pb):
    """Copy reference-less nodes pack by pack, reporting progress on pb.

    :param nodes: An iterable of (index, key, value) tuples.
    :param index_map: A mapping from index to the (transport, path) of the
        pack holding its data.
    :param writer: The writer the raw records are added to.
    :param write_index: The index receiving one node per copied record.
    :param pb: The progress bar to update.
    """
    # for record verification
    verifier = KnitVersionedFiles(None, None)
    # plan a readv on each source pack:
    # group by pack
    nodes = sorted(nodes)
    # how to map this into knit.py - or knit.py into this?
    # we don't want the typical knit logic, we want grouping by pack
    # at this point - perhaps a helper library for the following code
    # duplication points?
    by_index = {}
    for index, key, value in nodes:
        by_index.setdefault(index, []).append((key, value))
    copied = 0
    pb.update("Copied record", copied, len(nodes))
    for index, items in by_index.iteritems():
        requests = []
        for key, value in items:
            # ---- KnitGraphIndex.get_position
            # value is one flag character followed by "offset length".
            fields = value[1:].split(' ')
            requests.append(
                (int(fields[0]), int(fields[1]), (key, value[0])))
        # linear scan up the pack
        requests.sort()
        # copy the data
        transport, path = index_map[index]
        reader = pack.make_readv_reader(transport, path,
            [request[0:2] for request in requests])
        for (names, read_func), (_offset, _length, (key, eol_flag)) in \
            izip(reader.iter_records(), requests):
            raw_data = read_func(None)
            # check the header only
            df, _ = verifier._parse_record_header(key, raw_data)
            df.close()
            pos, size = writer.add_bytes_record(raw_data, names)
            write_index.add_node(key, eol_flag + "%d %d" % (pos, size))
            pb.update("Copied record", copied)
            copied += 1

800

801

def _copy_nodes_graph(self, index_map, writer, write_index,
    readv_group_iter, total_items, output_lines=False):
    """Copy knit nodes between packs.

    This is a generator: nothing is copied until it is iterated.

    :param output_lines: Return lines present in the copied data as
        an iterator of line,version_id.
    """
    progress = ui.ui_factory.nested_progress_bar()
    try:
        copier = self._do_copy_nodes_graph(index_map, writer,
            write_index, output_lines, progress, readv_group_iter,
            total_items)
        for item in copier:
            yield item
    except Exception:
        # Python 2.4 does not permit try:finally: in a generator.
        progress.finished()
        raise
    else:
        progress.finished()

819

820

def _do_copy_nodes_graph(self, index_map, writer, write_index,
    output_lines, pb, readv_group_iter, total_items):
    """Generator copying graph nodes group by group.

    :param index_map: A mapping from index to the (transport, path) of the
        pack holding its data.
    :param writer: The writer the raw records are added to.
    :param write_index: The index receiving one node per copied record.
    :param output_lines: When true, parse each record fully and yield
        (line, key) for every line of its content.
    :param pb: The progress bar to update.
    :param readv_group_iter: An iterable of
        (index, readv_vector, node_vector) tuples.
    :param total_items: The total handed to the progress bar.
    """
    # for record verification
    verifier = KnitVersionedFiles(None, None)
    # for line extraction when requested (inventories only)
    if output_lines:
        factory = KnitPlainFactory()
    copied = 0
    pb.update("Copied record", copied, total_items)
    for index, readv_vector, node_vector in readv_group_iter:
        # copy the data
        transport, path = index_map[index]
        reader = pack.make_readv_reader(transport, path, readv_vector)
        for (names, read_func), (key, eol_flag, references) in \
            izip(reader.iter_records(), node_vector):
            raw_data = read_func(None)
            if not output_lines:
                # check the header only
                df, _ = verifier._parse_record_header(key, raw_data)
                df.close()
            else:
                # read the entire thing
                content, _ = verifier._parse_record(key[-1], raw_data)
                # An empty last reference list selects the fulltext
                # parser; otherwise the record is read as a line delta.
                if len(references[-1]) == 0:
                    line_iterator = factory.get_fulltext_content(content)
                else:
                    line_iterator = factory.get_linedelta_content(content)
                for line in line_iterator:
                    yield line, key
            pos, size = writer.add_bytes_record(raw_data, names)
            write_index.add_node(key, eol_flag + "%d %d" % (pos, size), references)
            pb.update("Copied record", copied)
            copied += 1

853

854

def _get_text_nodes(self):
    """Return the text index map and the text nodes selected for copying.

    :return: A tuple (text_index_map, nodes) where text_index_map is the
        index -> pack tuple mapping for the text indices of self.packs and
        nodes is the index content restricted by self._text_filter.
    """
    collection = self._pack_collection
    map_and_indices = collection._packs_list_to_pack_map_and_index_list(
        self.packs, 'text_index')
    # Only the map half is needed; the ordered index list is dropped.
    text_index_map = map_and_indices[0]
    text_nodes = collection._index_contents(text_index_map,
                                            self._text_filter)
    return text_index_map, text_nodes

859

860

def _least_readv_node_readv(self, nodes):

861

"""Generate request groups for nodes using the least readv's.

862

863

:param nodes: An iterable of graph index nodes.

864

:return: Total node count and an iterator of the data needed to perform

865

readvs to obtain the data for nodes. Each item yielded by the

866

iterator is a tuple with:

867

index, readv_vector, node_vector. readv_vector is a list ready to

868

hand to the transport readv method, and node_vector is a list of

869

(key, eol_flag, references) for the the node retrieved by the

870

matching readv_vector.

871

"""

872

# group by pack so we do one readv per pack

873

nodes = sorted(nodes)

874

total = len(nodes)

875

request_groups = {}

876

for index, key, value, references in nodes:

877

if index not in request_groups:

878

request_groups[index] = []

879

request_groups[index].append((key, value, references))

880

result = []

881

for index, items in request_groups.iteritems():

882

pack_readv_requests = []

883

for key, value, references in items:

884

# ---- KnitGraphIndex.get_position

885

bits = value[1:].split(' ')

886

offset, length = int(bits[0]), int(bits[1])

887

pack_readv_requests.append(

888

((offset, length), (key, value[0], references)))

889

# linear scan up the pack to maximum range combining.

890

pack_readv_requests.sort()

891

# split out the readv and the node data.

892

pack_readv = [readv for readv, node in pack_readv_requests]

893

node_vector = [node for readv, node in pack_readv_requests]

894

result.append((index, pack_readv, node_vector))

895

return total, result

896

897

def _log_copied_texts(self):
    """Write a trace line about the copied file texts.

    Nothing is logged unless the 'pack' debug flag is set. The line records
    the upload location and random name of the new pack, the number of keys
    in its text index and the time elapsed since the pack's start_time.
    """
    if 'pack' not in debug.debug_flags:
        return
    new_pack = self.new_pack
    mutter('%s: create_pack: file texts copied: %s%s %d items t+%6.3fs',
           time.ctime(), self._pack_collection._upload_transport.base,
           new_pack.random_name,
           new_pack.text_index.key_count(),
           time.time() - new_pack.start_time)

904

905

def _process_inventory_lines(self, inv_lines):
    """Use up the inv_lines generator and set up a text key filter.

    The repository is asked which file ids are referenced by the given
    inventory lines for self.revision_keys; the answer is flattened into a
    list of (file_id, revision_id) keys stored on self._text_filter.

    :param inv_lines: The inventory lines to scan.
    """
    repo = self._pack_collection.repo
    fileid_revisions = repo._find_file_ids_from_xml_inventory_lines(
        inv_lines, self.revision_keys)
    self._text_filter = [
        (fileid, file_revid)
        for fileid, file_revids in fileid_revisions.iteritems()
        for file_revid in file_revids]

914

915

def _revision_node_readv(self, revision_nodes):
    """Return the total revisions and the readv's to issue.

    This implementation simply delegates to _least_readv_node_readv.

    :param revision_nodes: The revision index contents for the packs being
        incorporated into the new pack.
    :return: As per _least_readv_node_readv.
    """
    total_and_requests = self._least_readv_node_readv(revision_nodes)
    return total_and_requests

923

924

def _use_pack(self, new_pack):
    """Decide whether the freshly created pack should be kept.

    :param new_pack: The pack that has just been created.
    :return: Whatever new_pack.data_inserted() reports, i.e. true when the
        pack should be used.
    """
    has_data = new_pack.data_inserted()
    return has_data

931

932

933

class OptimisingPacker(Packer):
    """A packer which spends more time to create better disk layouts."""

    def _revision_node_readv(self, revision_nodes):
        """Return the total revisions and the readv's to issue.

        The requests are emitted in reverse topological order, so that
        children are placed before their ancestors. Every revision gets a
        request of its own.

        :param revision_nodes: The revision index contents for the packs
            being incorporated into the new pack.
        :return: As per _least_readv_node_readv.
        """
        # Build the parent graph and remember each node's details by key.
        parent_map = {}
        details = {}
        for index, key, value, references in revision_nodes:
            parent_map[key] = references[0]
            details[key] = (index, value, references)
        sorted_keys = tsort.topo_sort(parent_map)
        revision_count = len(sorted_keys)
        # Single IO is pathological, but it will work as a starting point.
        readv_requests = []
        for key in reversed(sorted_keys):
            index, value, references = details[key]
            # ---- KnitGraphIndex.get_position
            # value is a one character flag followed by "offset length".
            fields = value[1:].split(' ')
            span = (int(fields[0]), int(fields[1]))
            node = (key, value[0], references)
            readv_requests.append((index, [span], [node]))
        # TODO: combine requests in the same index that are in ascending
        # order.
        return revision_count, readv_requests

965

966

967

class ReconcilePacker(Packer):
    """A packer which regenerates indices etc as it copies.

    This is used by ``bzr reconcile`` to cause parent text pointers to be
    regenerated.
    """

    def _extra_init(self):
        """Start out assuming that reconcile has not altered any data."""
        self._data_changed = False

    def _process_inventory_lines(self, inv_lines):
        """Generate a text key reference map for reconciling with.

        :param inv_lines: The inventory lines to scan for text references.
        """
        repo = self._pack_collection.repo
        self._text_refs = \
            repo._find_text_key_references_from_xml_inventory_lines(
                inv_lines)
        # during reconcile we:
        #  - convert unreferenced texts to full texts
        #  - correct texts which reference a text not copied to be full texts
        #  - copy all others as-is but with corrected parents.
        #  - so at this point we don't know enough to decide what becomes a
        #    full text.
        self._text_filter = None

    def _copy_text_texts(self):
        """Work out which texts the new pack should hold, then copy them.

        Texts whose stored parents already match the ideal parents are bulk
        copied unchanged. Texts whose left-most parent matches (or which
        have no parents) are bulk copied with corrected references. All
        remaining texts are re-inserted one at a time from the repository.
        Texts with no entry in the ideal index are not copied at all.

        :raises BzrError: If a text's parent has a different file id, or if
            the new pack ends up referring to compression parents that it
            does not contain.
        """
        self.pb.update("Copying content texts", 3)
        # we have three major tasks here:
        # 1) generate the ideal index
        repo = self._pack_collection.repo
        ancestors = {}
        for _index, rev_key, _value, rev_refs in \
                self.new_pack.revision_index.iter_all_entries():
            ancestors[rev_key[0]] = tuple(ref[0] for ref in rev_refs[0])
        ideal_index = repo._generate_text_key_index(self._text_refs,
                                                    ancestors)
        # 2) generate a text_nodes list that contains all the deltas that
        #    can be used as-is, with corrected parents.
        ok_nodes = []
        bad_texts = []
        # NOTE(review): collected but not read again within this method.
        discarded_nodes = []
        null_parents = (_mod_revision.NULL_REVISION,)
        text_index_map, text_nodes = self._get_text_nodes()
        for node in text_nodes:
            # node layout: 0 - index, 1 - key, 2 - value, 3 - refs
            text_key = node[1]
            try:
                ideal_parents = tuple(ideal_index[text_key])
            except KeyError:
                discarded_nodes.append(node)
                self._data_changed = True
                continue
            if ideal_parents == null_parents:
                ideal_parents = ()
            if ideal_parents == node[3][0]:
                # no change needed.
                ok_nodes.append(node)
            elif ideal_parents[0:1] == node[3][0][0:1]:
                # the left most parent is the same, or there are no parents
                # today. Either way, we can preserve the representation as
                # long as we change the refs to be inserted.
                self._data_changed = True
                corrected_refs = (ideal_parents, node[3][1])
                ok_nodes.append((node[0], text_key, node[2], corrected_refs))
            else:
                # Reinsert this text completely
                bad_texts.append((text_key, ideal_parents))
                self._data_changed = True
        # we're finished with some data.
        del ideal_index
        del text_nodes
        # 3) bulk copy the ok data
        total_items, readv_group_iter = self._least_readv_node_readv(
            ok_nodes)
        # _copy_nodes_graph is a generator; list() drives it to completion.
        list(self._copy_nodes_graph(text_index_map, self.new_pack._writer,
                                    self.new_pack.text_index,
                                    readv_group_iter, total_items))
        # 4) adhoc copy all the other texts.
        # We have to topologically insert all texts otherwise we can fail to
        # reconcile when parts of a single delta chain are preserved intact,
        # and other parts are not. E.g. Discarded->d1->d2->d3. d1 will be
        # reinserted, and if d3 has incorrect parents it will also be
        # reinserted. If we insert d3 first, d2 is present (as it was bulk
        # copied), so we will try to delta, but d2 is not currently able to
        # be extracted because its basis d1 is not present. Topologically
        # sorting addresses this. The following generates a sort for all the
        # texts that are being inserted without having to reference the
        # entire text key space (we only topo sort the revisions, which is
        # smaller).
        topo_order = tsort.topo_sort(ancestors)
        rev_order = dict(zip(topo_order, range(len(topo_order))))
        # Each entry is (text_key, parents); text_key[1] is the revision.
        bad_texts.sort(key=lambda entry: rev_order[entry[0][1]])
        # NOTE(review): transaction and file_id_index are not referenced
        # again in this method; the calls are retained as they were.
        transaction = repo.get_transaction()
        file_id_index = GraphIndexPrefixAdapter(
            self.new_pack.text_index,
            ('blank', ), 1,
            add_nodes_callback=self.new_pack.text_index.add_nodes)
        new_text_index = self.new_pack.text_index
        data_access = _DirectPackAccess(
            {new_text_index: self.new_pack.access_tuple()})
        data_access.set_writer(self.new_pack._writer, new_text_index,
                               self.new_pack.access_tuple())
        knit_index = _KnitGraphIndex(
            new_text_index,
            add_callback=self.new_pack.text_index.add_nodes,
            deltas=True, parents=True, is_locked=repo.is_locked)
        output_texts = KnitVersionedFiles(
            knit_index, data_access=data_access, max_delta_chain=200)
        for key, parent_keys in bad_texts:
            # We refer to the new pack to delta data being output.
            # A possible improvement would be to catch errors on short reads
            # and only flush then.
            self.new_pack.flush()
            parents = []
            for parent_key in parent_keys:
                if parent_key[0] != key[0]:
                    # Graph parents must match the fileid
                    raise errors.BzrError('Mismatched key parent %r:%r' %
                        (key, parent_keys))
                parents.append(parent_key[1])
            record = repo.texts.get_record_stream(
                [key], 'unordered', True).next()
            text_lines = split_lines(record.get_bytes_as('fulltext'))
            output_texts.add_lines(key, parent_keys, text_lines,
                                   random_id=True, check_content=False)
        # 5) check that nothing inserted has a reference outside the
        #    keyspace.
        missing_text_keys = \
            self.new_pack._external_compression_parents_of_texts()
        if missing_text_keys:
            raise errors.BzrError('Reference to missing compression parents %r'
                % (missing_text_keys,))
        self._log_copied_texts()

    def _use_pack(self, new_pack):
        """Override _use_pack to check for reconcile having changed content.

        A difference between the inventory keys of the whole collection and
        those of new_pack also counts as a change.

        :param new_pack: The pack that has just been created.
        :return: True only if new_pack has data and something changed.
        """
        # XXX: we might be better checking this at the copy time.
        inv_index = self._pack_collection.inventory_index.combined_index
        original_inventory_keys = set(
            entry[1] for entry in inv_index.iter_all_entries())
        new_inventory_keys = set(
            entry[1] for entry in new_pack.inventory_index.iter_all_entries())
        if new_inventory_keys != original_inventory_keys:
            self._data_changed = True
        return new_pack.data_inserted() and self._data_changed

1107

1108

1109

class RepositoryPackCollection(object):

1110

"""Management of packs within a repository."""

1111

1112

def __init__(self, repo, transport, index_transport, upload_transport,

1113

pack_transport):

1114

"""Create a new RepositoryPackCollection.

1115

1116

:param transport: Addresses the repository base directory

1117

(typically .bzr/repository/).

1118

:param index_transport: Addresses the directory containing indices.

1119

:param upload_transport: Addresses the directory into which packs are written

1120

while they're being created.

1121

:param pack_transport: Addresses the directory of existing complete packs.

1122

"""

1123

self.repo = repo

1124

self.transport = transport

1125

self._index_transport = index_transport

1126

self._upload_transport = upload_transport

1127

self._pack_transport = pack_transport

1128

self._suffix_offsets = {'.rix': 0, '.iix': 1, '.tix': 2, '.six': 3}

1129

self.packs = []

1130

# name:Pack mapping

1131

self._packs_by_name = {}

1132

# the previous pack-names content

1133

self._packs_at_load = None

1134

# when a pack is being created by this object, the state of that pack.

1135

self._new_pack = None

1136

# aggregated revision index data

1137

self.revision_index = AggregateIndex()

1138

self.inventory_index = AggregateIndex()

1139

self.text_index = AggregateIndex()

1140

self.signature_index = AggregateIndex()

1141

1142

def add_pack_to_memory(self, pack):

1143

"""Make a Pack object available to the repository to satisfy queries.

1144

1145

:param pack: A Pack object.

1146

"""

1147

if pack.name in self._packs_by_name:

1148

raise AssertionError()

1149

self.packs.append(pack)

1150

self._packs_by_name[pack.name] = pack

1151

self.revision_index.add_index(pack.revision_index, pack)

1152

self.inventory_index.add_index(pack.inventory_index, pack)

1153

self.text_index.add_index(pack.text_index, pack)

1154

self.signature_index.add_index(pack.signature_index, pack)

1155

1156

def all_packs(self):

1157

"""Return a list of all the Pack objects this repository has.

1158

1159

Note that an in-progress pack being created is not returned.

1160

1161

:return: A list of Pack objects for all the packs in the repository.

1162

"""

1163

result = []

1164

for name in self.names():

1165

result.append(self.get_pack_by_name(name))

1166

return result

1167

1168

def autopack(self):

1169

"""Pack the pack collection incrementally.

1170

1171

This will not attempt global reorganisation or recompression,

1172

rather it will just ensure that the total number of packs does

1173

not grow without bound. It uses the _max_pack_count method to

1174

determine if autopacking is needed, and the pack_distribution

1175

method to determine the number of revisions in each pack.

1176

1177

If autopacking takes place then the packs name collection will have

1178

been flushed to disk - packing requires updating the name collection

1179

in synchronisation with certain steps. Otherwise the names collection

1180

is not flushed.

1181

1182

:return: True if packing took place.

1183

"""

1184

# XXX: Should not be needed when the management of indices is sane.

1185

total_revisions = self.revision_index.combined_index.key_count()

1186

total_packs = len(self._names)

1187

if self._max_pack_count(total_revisions) >= total_packs:

1188

return False

1189

# XXX: the following may want to be a class, to pack with a given

1190

# policy.

1191

mutter('Auto-packing repository %s, which has %d pack files, '

1192

'containing %d revisions into %d packs.', self, total_packs,

1193

total_revisions, self._max_pack_count(total_revisions))

1194

# determine which packs need changing

1195

pack_distribution = self.pack_distribution(total_revisions)

1196

existing_packs = []

1197

for pack in self.all_packs():

1198

revision_count = pack.get_revision_count()

1199

if revision_count == 0:

1200

# revision less packs are not generated by normal operation,

1201

# only by operations like sign-my-commits, and thus will not

1202

# tend to grow rapdily or without bound like commit containing

1203

# packs do - leave them alone as packing them really should

1204

# group their data with the relevant commit, and that may

1205

# involve rewriting ancient history - which autopack tries to

1206

# avoid. Alternatively we could not group the data but treat

1207

# each of these as having a single revision, and thus add

1208

# one revision for each to the total revision count, to get

1209

# a matching distribution.

1210

continue

1211

existing_packs.append((revision_count, pack))

1212

pack_operations = self.plan_autopack_combinations(

1213

existing_packs, pack_distribution)

1214

self._execute_pack_operations(pack_operations)

1215

return True

1216

1217

def _execute_pack_operations(self, pack_operations, _packer_class=Packer):

1218

"""Execute a series of pack operations.

1219

1220

:param pack_operations: A list of [revision_count, packs_to_combine].

1221

:param _packer_class: The class of packer to use (default: Packer).

1222

:return: None.

1223

"""

1224

for revision_count, packs in pack_operations:

1225

# we may have no-ops from the setup logic

1226

if len(packs) == 0:

1227

continue

1228

_packer_class(self, packs, '.autopack').pack()

1229

for pack in packs:

1230

self._remove_pack_from_memory(pack)

1231

# record the newly available packs and stop advertising the old

1232

# packs

1233

self._save_pack_names(clear_obsolete_packs=True)

1234

# Move the old packs out of the way now they are no longer referenced.

1235

for revision_count, packs in pack_operations:

1236

self._obsolete_packs(packs)

1237

1238

def lock_names(self):

1239

"""Acquire the mutex around the pack-names index.

1240

1241

This cannot be used in the middle of a read-only transaction on the

1242

repository.

1243

"""

1244

self.repo.control_files.lock_write()

1245

1246

def pack(self):

1247

"""Pack the pack collection totally."""

1248

self.ensure_loaded()

1249

total_packs = len(self._names)

1250

if total_packs < 2:

1251

# This is arguably wrong because we might not be optimal, but for

1252

# now lets leave it in. (e.g. reconcile -> one pack. But not

1253

# optimal.

1254

return

1255

total_revisions = self.revision_index.combined_index.key_count()

1256

# XXX: the following may want to be a class, to pack with a given

1257

# policy.

1258

mutter('Packing repository %s, which has %d pack files, '

1259

'containing %d revisions into 1 packs.', self, total_packs,

1260

total_revisions)

1261

# determine which packs need changing

1262

pack_distribution = [1]

1263

pack_operations = [[0, []]]

1264

for pack in self.all_packs():

1265

pack_operations[-1][0] += pack.get_revision_count()

1266

pack_operations[-1][1].append(pack)

1267

self._execute_pack_operations(pack_operations, OptimisingPacker)

1268

1269

def plan_autopack_combinations(self, existing_packs, pack_distribution):

1270

"""Plan a pack operation.

1271

1272

:param existing_packs: The packs to pack. (A list of (revcount, Pack)

1273

tuples).

1274

:param pack_distribution: A list with the number of revisions desired

1275

in each pack.

1276

"""

1277

if len(existing_packs) <= len(pack_distribution):

1278

return []

1279

existing_packs.sort(reverse=True)

1280

pack_operations = [[0, []]]

1281

# plan out what packs to keep, and what to reorganise

1282

while len(existing_packs):

1283

# take the largest pack, and if its less than the head of the

1284

# distribution chart we will include its contents in the new pack for

1285

# that position. If its larger, we remove its size from the

1286

# distribution chart

1287

next_pack_rev_count, next_pack = existing_packs.pop(0)

1288

if next_pack_rev_count >= pack_distribution[0]:

1289

# this is already packed 'better' than this, so we can

1290

# not waste time packing it.

1291

while next_pack_rev_count > 0:

1292

next_pack_rev_count -= pack_distribution[0]

1293

if next_pack_rev_count >= 0:

1294

# more to go

1295

del pack_distribution[0]

1296

else:

1297

# didn't use that entire bucket up

1298

pack_distribution[0] = -next_pack_rev_count

1299

else:

1300

# add the revisions we're going to add to the next output pack

1301

pack_operations[-1][0] += next_pack_rev_count

1302

# allocate this pack to the next pack sub operation

1303

pack_operations[-1][1].append(next_pack)

1304

if pack_operations[-1][0] >= pack_distribution[0]:

1305

# this pack is used up, shift left.

1306

del pack_distribution[0]

1307

pack_operations.append([0, []])

1308

1309

return pack_operations

1310

1311

def ensure_loaded(self):

1312

# NB: if you see an assertion error here, its probably access against

1313

# an unlocked repo. Naughty.

1314

if not self.repo.is_locked():

1315

raise errors.ObjectNotLocked(self.repo)

1316

if self._names is None:

1317

self._names = {}

1318

self._packs_at_load = set()

1319

for index, key, value in self._iter_disk_pack_index():

1320

name = key[0]

1321

self._names[name] = self._parse_index_sizes(value)

1322

self._packs_at_load.add((key, value))

1323

# populate all the metadata.

1324

self.all_packs()

1325

1326

def _parse_index_sizes(self, value):

1327

"""Parse a string of index sizes."""

1328

return tuple([int(digits) for digits in value.split(' ')])

1329

1330

def get_pack_by_name(self, name):

1331

"""Get a Pack object by name.

1332

1333

:param name: The name of the pack - e.g. '123456'

1334

:return: A Pack object.

1335

"""

1336

try:

1337

return self._packs_by_name[name]

1338

except KeyError:

1339

rev_index = self._make_index(name, '.rix')

1340

inv_index = self._make_index(name, '.iix')

1341

txt_index = self._make_index(name, '.tix')

1342

sig_index = self._make_index(name, '.six')

1343

result = ExistingPack(self._pack_transport, name, rev_index,

1344

inv_index, txt_index, sig_index)

1345

self.add_pack_to_memory(result)

1346

return result

1347

1348

def allocate(self, a_new_pack):

1349

"""Allocate name in the list of packs.

1350

1351

:param a_new_pack: A NewPack instance to be added to the collection of

1352

packs for this repository.

1353

"""

1354

self.ensure_loaded()

1355

if a_new_pack.name in self._names:

1356

raise errors.BzrError(

1357

'Pack %r already exists in %s' % (a_new_pack.name, self))

1358

self._names[a_new_pack.name] = tuple(a_new_pack.index_sizes)

1359

self.add_pack_to_memory(a_new_pack)

1360

1361

def _iter_disk_pack_index(self):

1362

"""Iterate over the contents of the pack-names index.

1363

1364

This is used when loading the list from disk, and before writing to

1365

detect updates from others during our write operation.

1366

:return: An iterator of the index contents.

1367

"""

1368

return GraphIndex(self.transport, 'pack-names', None

1369

).iter_all_entries()

1370

1371

def _make_index(self, name, suffix):

1372

size_offset = self._suffix_offsets[suffix]

1373

index_name = name + suffix

1374

index_size = self._names[name][size_offset]

1375

return GraphIndex(

1376

self._index_transport, index_name, index_size)

1377

1378

def _max_pack_count(self, total_revisions):

1379

"""Return the maximum number of packs to use for total revisions.

1380

1381

:param total_revisions: The total number of revisions in the

1382

repository.

1383

"""

1384

if not total_revisions:

1385

return 1

1386

digits = str(total_revisions)

1387

result = 0

1388

for digit in digits:

1389

result += int(digit)

1390

return result

1391

1392

def names(self):

1393

"""Provide an order to the underlying names."""

1394

return sorted(self._names.keys())

1395

1396

def _obsolete_packs(self, packs):

1397

"""Move a number of packs which have been obsoleted out of the way.

1398

1399

Each pack and its associated indices are moved out of the way.

1400

1401

Note: for correctness this function should only be called after a new

1402

pack names index has been written without these pack names, and with

1403

the names of packs that contain the data previously available via these

1404

packs.

1405

1406

:param packs: The packs to obsolete.

1407

:param return: None.

1408

"""

1409

for pack in packs:

1410

pack.pack_transport.rename(pack.file_name(),

1411

'../obsolete_packs/' + pack.file_name())

1412

# TODO: Probably needs to know all possible indices for this pack

1413

# - or maybe list the directory and move all indices matching this

1414

# name whether we recognize it or not?

1415

for suffix in ('.iix', '.six', '.tix', '.rix'):

1416

self._index_transport.rename(pack.name + suffix,

1417

'../obsolete_packs/' + pack.name + suffix)

1418

1419

def pack_distribution(self, total_revisions):

1420

"""Generate a list of the number of revisions to put in each pack.

1421

1422

:param total_revisions: The total number of revisions in the

1423

repository.

1424

"""

1425

if total_revisions == 0:

1426

return [0]

1427

digits = reversed(str(total_revisions))

1428

result = []

1429

for exponent, count in enumerate(digits):

1430

size = 10 ** exponent

1431

for pos in range(int(count)):

1432

result.append(size)

1433

return list(reversed(result))

1434

1435

def _pack_tuple(self, name):

1436

"""Return a tuple with the transport and file name for a pack name."""

1437

return self._pack_transport, name + '.pack'

1438

1439

def _remove_pack_from_memory(self, pack):

1440

"""Remove pack from the packs accessed by this repository.

1441

1442

Only affects memory state, until self._save_pack_names() is invoked.

1443

"""

1444

self._names.pop(pack.name)

1445

self._packs_by_name.pop(pack.name)

1446

self._remove_pack_indices(pack)

1447

1448

def _remove_pack_indices(self, pack):

1449

"""Remove the indices for pack from the aggregated indices."""

1450

self.revision_index.remove_index(pack.revision_index, pack)

1451

self.inventory_index.remove_index(pack.inventory_index, pack)

1452

self.text_index.remove_index(pack.text_index, pack)

1453

self.signature_index.remove_index(pack.signature_index, pack)

1454

1455

def reset(self):

1456

"""Clear all cached data."""

1457

# cached revision data

1458

self.repo._revision_knit = None

1459

self.revision_index.clear()

1460

# cached signature data

1461

self.repo._signature_knit = None

1462

self.signature_index.clear()

1463

# cached file text data

1464

self.text_index.clear()

1465

self.repo._text_knit = None

1466

# cached inventory data

1467

self.inventory_index.clear()

1468

# remove the open pack

1469

self._new_pack = None

1470

# information about packs.

1471

self._names = None

1472

self.packs = []

1473

self._packs_by_name = {}

1474

self._packs_at_load = None

1475

1476

def _make_index_map(self, index_suffix):

1477

"""Return information on existing indices.

1478

1479

:param suffix: Index suffix added to pack name.

1480

1481

:returns: (pack_map, indices) where indices is a list of GraphIndex

1482

objects, and pack_map is a mapping from those objects to the

1483

pack tuple they describe.

1484

"""

1485

# TODO: stop using this; it creates new indices unnecessarily.

1486

self.ensure_loaded()

1487

suffix_map = {'.rix': 'revision_index',

1488

'.six': 'signature_index',

1489

'.iix': 'inventory_index',

1490

'.tix': 'text_index',

1491

}

1492

return self._packs_list_to_pack_map_and_index_list(self.all_packs(),

1493

suffix_map[index_suffix])

1494

1495

def _packs_list_to_pack_map_and_index_list(self, packs, index_attribute):

1496

"""Convert a list of packs to an index pack map and index list.

1497

1498

:param packs: The packs list to process.

1499

:param index_attribute: The attribute that the desired index is found

1500

on.

1501

:return: A tuple (map, list) where map contains the dict from

1502

index:pack_tuple, and lsit contains the indices in the same order

1503

as the packs list.

1504

"""

1505

indices = []

1506

pack_map = {}

1507

for pack in packs:

1508

index = getattr(pack, index_attribute)

1509

indices.append(index)

1510

pack_map[index] = (pack.pack_transport, pack.file_name())

1511

return pack_map, indices

1512

1513

def _index_contents(self, pack_map, key_filter=None):

1514

"""Get an iterable of the index contents from a pack_map.

1515

1516

:param pack_map: A map from indices to pack details.

1517

:param key_filter: An optional filter to limit the

1518

keys returned.

1519

"""

1520

indices = [index for index in pack_map.iterkeys()]

1521

all_index = CombinedGraphIndex(indices)

1522

if key_filter is None:

1523

return all_index.iter_all_entries()

1524

else:

1525

return all_index.iter_entries(key_filter)

1526

1527

def _unlock_names(self):

1528

"""Release the mutex around the pack-names index."""

1529

self.repo.control_files.unlock()

1530

1531

def _save_pack_names(self, clear_obsolete_packs=False):

1532

"""Save the list of packs.

1533

1534

This will take out the mutex around the pack names list for the

1535

duration of the method call. If concurrent updates have been made, a

1536

three-way merge between the current list and the current in memory list

1537

is performed.

1538

1539

:param clear_obsolete_packs: If True, clear out the contents of the

1540

obsolete_packs directory.

1541

"""

1542

self.lock_names()

1543

try:

1544

builder = GraphIndexBuilder()

1545

# load the disk nodes across

1546

disk_nodes = set()

1547

for index, key, value in self._iter_disk_pack_index():

1548

disk_nodes.add((key, value))

1549

# do a two-way diff against our original content

1550

current_nodes = set()

1551

for name, sizes in self._names.iteritems():

1552

current_nodes.add(

1553

((name, ), ' '.join(str(size) for size in sizes)))

1554

deleted_nodes = self._packs_at_load - current_nodes

1555

new_nodes = current_nodes - self._packs_at_load

1556

disk_nodes.difference_update(deleted_nodes)

1557

disk_nodes.update(new_nodes)

1558

# TODO: handle same-name, index-size-changes here -

1559

# e.g. use the value from disk, not ours, *unless* we're the one

1560

# changing it.

1561

for key, value in disk_nodes:

1562

builder.add_node(key, value)

1563

self.transport.put_file('pack-names', builder.finish(),

1564

mode=self.repo.control_files._file_mode)

1565

# move the baseline forward

1566

self._packs_at_load = disk_nodes

1567

# now clear out the obsolete packs directory

1568

if clear_obsolete_packs:

1569

self.transport.clone('obsolete_packs').delete_multi(

1570

self.transport.list_dir('obsolete_packs'))

1571

finally:

1572

self._unlock_names()

1573

# synchronise the memory packs list with what we just wrote:

1574

new_names = dict(disk_nodes)

1575

# drop no longer present nodes

1576

for pack in self.all_packs():

1577

if (pack.name,) not in new_names:

1578

self._remove_pack_from_memory(pack)

1579

# add new nodes/refresh existing ones

1580

for key, value in disk_nodes:

1581

name = key[0]

1582

sizes = self._parse_index_sizes(value)

1583

if name in self._names:

1584

# existing

1585

if sizes != self._names[name]:

1586

# the pack for name has had its indices replaced - rare but

1587

# important to handle. XXX: probably can never happen today

1588

# because the three-way merge code above does not handle it

1589

# - you may end up adding the same key twice to the new

1590

# disk index because the set values are the same, unless

1591

# the only index shows up as deleted by the set difference

1592

# - which it may. Until there is a specific test for this,

1593

# assume its broken. RBC 20071017.

1594

self._remove_pack_from_memory(self.get_pack_by_name(name))

1595

self._names[name] = sizes

1596

self.get_pack_by_name(name)

1597

else:

1598

# new

1599

self._names[name] = sizes

1600

self.get_pack_by_name(name)

1601

1602

def _start_write_group(self):

1603

# Do not permit preparation for writing if we're not in a 'write lock'.

1604

if not self.repo.is_write_locked():

1605

raise errors.NotWriteLocked(self)

1606

self._new_pack = NewPack(self._upload_transport, self._index_transport,

1607

self._pack_transport, upload_suffix='.pack',

1608

file_mode=self.repo.control_files._file_mode)

1609

# allow writing: queue writes to a new index

1610

self.revision_index.add_writable_index(self._new_pack.revision_index,

1611

self._new_pack)

1612

self.inventory_index.add_writable_index(self._new_pack.inventory_index,

1613

self._new_pack)

1614

self.text_index.add_writable_index(self._new_pack.text_index,

1615

self._new_pack)

1616

self.signature_index.add_writable_index(self._new_pack.signature_index,

1617

self._new_pack)

1618

1619

self.repo.inventories._index._add_callback = self.inventory_index.add_callback

1620

self.repo.revisions._index._add_callback = self.revision_index.add_callback

1621

self.repo.signatures._index._add_callback = self.signature_index.add_callback

1622

self.repo.texts._index._add_callback = self.text_index.add_callback

1623

1624

def _abort_write_group(self):
    """Discard the pack being written, if there is one.

    The pending pack is aborted, its indices are removed from the
    collection and self._new_pack is cleared.  The repository's _text_knit
    is reset to None whether or not a pack was pending.
    """
    # FIXME: just drop the transient index.
    pending = self._new_pack
    if pending is not None:
        pending.abort()
        self._remove_pack_indices(pending)
        self._new_pack = None
    self.repo._text_knit = None

1632

1633

def _commit_write_group(self):
    """Finish the write group, keeping the new pack only if it has data.

    The pending pack's indices are removed from the collection first.  If
    data was inserted the pack is finished and allocated, and autopack is
    run; the pack names are saved explicitly when autopack reports that it
    did nothing.  A pack without data is aborted.  In both cases
    self._new_pack is cleared and the repository's _text_knit is reset.
    """
    pending = self._new_pack
    self._remove_pack_indices(pending)
    if not pending.data_inserted():
        # Nothing was written: throw the empty pack away.
        pending.abort()
        self._new_pack = None
    else:
        # Get all the data to disk and ready to use.
        pending.finish()
        self.allocate(pending)
        self._new_pack = None
        autopacked = self.autopack()
        if not autopacked:
            # When autopack takes no steps, the names list is still
            # unsaved.
            self._save_pack_names()
    self.repo._text_knit = None

1648

1649

1650

class KnitPackRepository(KnitRepository):
    """Knit repository that keeps its data in a RepositoryPackCollection."""

    def __init__(self, _format, a_bzrdir, control_files, _commit_builder_class,
                 _serializer):
        """Attach a pack collection and build the versioned-file stores.

        The pack collection is created from the control files' transport
        and its 'indices', 'upload' and 'packs' clones.  The remaining
        arguments are passed straight through to KnitRepository.__init__.
        """
        transport = control_files._transport
        self._pack_collection = RepositoryPackCollection(
            self,
            transport,
            transport.clone('indices'),
            transport.clone('upload'),
            transport.clone('packs'))
        KnitRepository.__init__(self, _format, a_bzrdir, control_files,
                                _commit_builder_class, _serializer)
        collection = self._pack_collection

        inventory_index = collection.inventory_index
        self.inventories = KnitVersionedFiles(
            _KnitGraphIndex(
                inventory_index.combined_index,
                add_callback=inventory_index.add_callback,
                deltas=True, parents=True, is_locked=self.is_locked),
            data_access=inventory_index.data_access,
            max_delta_chain=200)

        revision_index = collection.revision_index
        self.revisions = KnitVersionedFiles(
            _KnitGraphIndex(
                revision_index.combined_index,
                add_callback=revision_index.add_callback,
                deltas=False, parents=True, is_locked=self.is_locked),
            data_access=revision_index.data_access,
            max_delta_chain=0)

        signature_index = collection.signature_index
        self.signatures = KnitVersionedFiles(
            _KnitGraphIndex(
                signature_index.combined_index,
                add_callback=signature_index.add_callback,
                deltas=False, parents=False, is_locked=self.is_locked),
            data_access=signature_index.data_access,
            max_delta_chain=0)

        text_index = collection.text_index
        self.texts = KnitVersionedFiles(
            _KnitGraphIndex(
                text_index.combined_index,
                add_callback=text_index.add_callback,
                deltas=True, parents=True, is_locked=self.is_locked),
            data_access=text_index.data_access,
            max_delta_chain=200)

        # Non-zero while the repository object is 'write locked' (as opposed
        # to the physical lock, which is only taken out around changes to
        # the pack-names list).  An alternative design would be a decorator
        # around the control files object that presents logical locks as
        # physical ones - consider it if this gets ugly. RBC 20071011
        self._write_lock_count = 0
        self._transaction = None
        # for tests
        self._reconcile_does_inventory_gc = True
        self._reconcile_fixes_text_parents = True
        self._reconcile_backsup_inventory = False

    def _abort_write_group(self):
        """Delegate aborting the write group to the pack collection."""
        self._pack_collection._abort_write_group()

    def _find_inconsistent_revision_parents(self):
        """Report revisions whose indexed parents disagree with their text.

        The parents recorded in the combined revision index are compared,
        1000 revisions at a time, with the parent_ids of the revisions
        returned by get_revisions.

        :returns: a list of (revision-id, parents-in-index,
            parents-in-revision) tuples, one for each mismatch.
        :raises errors.ObjectNotLocked: if the repository is not locked.
        """
        if not self.is_locked():
            raise errors.ObjectNotLocked(self)
        pb = ui.ui_factory.nested_progress_bar()
        mismatches = []
        try:
            combined = self._pack_collection.revision_index.combined_index
            cached = []
            # Collect the cached index values for all revisions, together
            # with the location in each index of the revision text, so that
            # sorting gives an order suitable for linear IO.
            for index, key, value, refs in combined.iter_all_entries():
                pos, length = value[1:].split(' ')
                cached.append((
                    index,
                    int(pos),
                    key[0],
                    tuple(parent[0] for parent in refs[0])))
                pb.update("Reading revision index.", 0, 0)
            cached.sort()
            batch_count = len(cached) / 1000 + 1
            pb.update("Checking cached revision graph.", 0, batch_count)
            for offset in xrange(batch_count):
                pb.update("Checking cached revision graph.", offset)
                start = offset * 1000
                batch = cached[start:start + 1000]
                if not batch:
                    break
                revisions = self.get_revisions([entry[2] for entry in batch])
                for revision, entry in zip(revisions, batch):
                    index_parents = entry[3]
                    rev_parents = tuple(revision.parent_ids)
                    if index_parents != rev_parents:
                        mismatches.append(
                            (revision.revision_id, index_parents,
                             rev_parents))
        finally:
            pb.finished()
        return mismatches

    @symbol_versioning.deprecated_method(symbol_versioning.one_one)
    def get_parents(self, revision_ids):
        """See graph._StackedParentsProvider.get_parents.

        Built on get_parent_map; revisions missing from the map yield None.
        """
        lookup = self.get_parent_map(revision_ids).get
        return [lookup(revision_id, None) for revision_id in revision_ids]

    def get_parent_map(self, keys):
        """See graph._StackedParentsProvider.get_parent_map

        Answers come from the combined revision index of the pack
        collection.  NULL_REVISION maps to an empty tuple, and a revision
        with no recorded parents maps to (NULL_REVISION,).
        """
        self._pack_collection.ensure_loaded()
        combined = self._pack_collection.revision_index.combined_index
        null_revision = _mod_revision.NULL_REVISION
        wanted = set(keys)
        found_parents = {}
        if null_revision in wanted:
            wanted.discard(null_revision)
            found_parents[null_revision] = ()
        search_keys = set((revision_id,) for revision_id in wanted)
        for _index, key, _value, refs in combined.iter_entries(search_keys):
            parent_keys = refs[0]
            if parent_keys:
                parents = tuple(parent[0] for parent in parent_keys)
            else:
                parents = (null_revision,)
            found_parents[key[0]] = parents
        return found_parents

    def has_revisions(self, revision_ids):
        """See Repository.has_revisions().

        None and NULL_REVISION are reported as present without consulting
        the index; everything else is looked up in the combined revision
        index.
        """
        pending = set(revision_ids)
        present = pending.intersection(
            set([None, _mod_revision.NULL_REVISION]))
        pending.difference_update(present)
        combined = self._pack_collection.revision_index.combined_index
        search_keys = [(revision_id,) for revision_id in pending]
        present.update(
            node[1][0] for node in combined.iter_entries(search_keys))
        return present

    def _make_parents_provider(self):
        """Wrap this repository in a graph.CachingParentsProvider."""
        return graph.CachingParentsProvider(self)

    def _refresh_data(self):
        """Reload the pack collection when the first lock has been taken.

        Applies when the write lock count is exactly 1, or when the control
        files hold exactly one lock in 'r' mode.
        """
        if self._write_lock_count != 1:
            control = self.control_files
            if not (control._lock_count == 1 and control._lock_mode == 'r'):
                return
        # forget what names there are
        self._pack_collection.reset()
        # XXX: Better to do an in-memory merge when acquiring a new lock -
        # factor out code from _save_pack_names.
        self._pack_collection.ensure_loaded()

    def _start_write_group(self):
        """Delegate starting the write group to the pack collection."""
        self._pack_collection._start_write_group()

    def _commit_write_group(self):
        """Delegate committing the write group to the pack collection."""
        return self._pack_collection._commit_write_group()

    def get_transaction(self):
        """Return the write transaction, or the control files' one."""
        if not self._write_lock_count:
            return self.control_files.get_transaction()
        return self._transaction

    def is_locked(self):
        """Return a true value if write locked or control files are locked."""
        return self._write_lock_count or self.control_files.is_locked()

    def is_write_locked(self):
        """Return the write lock count, which is true while write locked."""
        return self._write_lock_count

    def lock_write(self, token=None):
        """Take, or re-enter, the logical write lock.

        The first write lock creates a WriteTransaction.

        :param token: accepted but not used by this method.
        :raises errors.ReadOnlyError: if the repository is locked but not
            write locked.
        """
        already_writing = self._write_lock_count
        if not already_writing and self.is_locked():
            raise errors.ReadOnlyError(self)
        self._write_lock_count += 1
        if self._write_lock_count == 1:
            from bzrlib import transactions
            self._transaction = transactions.WriteTransaction()
        self._refresh_data()

    def lock_read(self):
        """Take a read lock.

        While write locked this only increments the write lock count;
        otherwise the control files are read locked.
        """
        if not self._write_lock_count:
            self.control_files.lock_read()
        else:
            self._write_lock_count += 1
        self._refresh_data()

    def leave_lock_in_place(self):
        """Not supported - always raises NotImplementedError."""
        raise NotImplementedError(self.leave_lock_in_place)

    def dont_leave_lock_in_place(self):
        """Not supported - always raises NotImplementedError."""
        raise NotImplementedError(self.dont_leave_lock_in_place)

    @needs_write_lock
    def pack(self):
        """Compress the data within the repository.

        The work is done by the pack collection's pack(), which packs all
        the data to a single pack.  In future it may recompress deltas or do
        other such expensive operations.
        """
        self._pack_collection.pack()

    @needs_write_lock
    def reconcile(self, other=None, thorough=False):
        """Reconcile this repository using a PackReconciler.

        :param other: accepted but not used by this method.
        :param thorough: passed through to PackReconciler.
        :returns: the reconciler, after reconcile() has been called on it.
        """
        from bzrlib.reconcile import PackReconciler
        reconciler = PackReconciler(self, thorough=thorough)
        reconciler.reconcile()
        return reconciler

    def unlock(self):
        """Release one level of locking.

        :raises errors.BzrError: if the last write lock is released while a
            write group is still open; the write group is aborted and the
            write lock state cleared before raising.
        """
        releasing_last_write = self._write_lock_count == 1
        if releasing_last_write and self._write_group is not None:
            self.abort_write_group()
            self._transaction = None
            self._write_lock_count = 0
            raise errors.BzrError(
                'Must end write group before releasing write lock on %s'
                % self)
        if not self._write_lock_count:
            self.control_files.unlock()
            return
        self._write_lock_count -= 1
        if not self._write_lock_count:
            # Last write lock released: finish the write transaction.
            finished = self._transaction
            self._transaction = None
            finished.finish()

1870

1871

1872

class RepositoryFormatPack(MetaDirRepositoryFormat):
    """Format logic for pack structured repositories.

    This repository format has:
     - a list of packs in pack-names
     - packs in packs/NAME.pack
     - indices in indices/NAME.{iix,six,tix,rix}
     - knit deltas in the packs, knit indices mapped to the indices.
     - thunk objects to support the knits programming API.
     - a format marker of its own
     - an optional 'shared-storage' flag
     - an optional 'no-working-trees' flag
     - a LockDir lock
    """

    # Derived classes set this to the repository class that open and
    # initialize should create.
    repository_class = None
    # Derived classes set this to the _commit_builder_class passed to the
    # repository constructor.
    _commit_builder_class = None
    # Derived classes set this to the _serializer passed to the repository
    # constructor.
    _serializer = None
    # External references are not supported in pack repositories yet.
    supports_external_lookups = False

    def initialize(self, a_bzrdir, shared=False):
        """Create a pack based repository.

        :param a_bzrdir: bzrdir to contain the new repository; must already
            be initialized.
        :param shared: If true the repository will be initialized as a shared
            repository.
        :returns: the result of opening the newly created repository.
        """
        mutter('creating repository in %s.', a_bzrdir.transport.base)
        # A freshly finished builder provides the initial 'pack-names' file.
        empty_names = GraphIndexBuilder().finish()
        format_marker = self.get_format_string()
        self._upload_blank_content(
            a_bzrdir,
            ['indices', 'obsolete_packs', 'packs', 'upload'],
            [('pack-names', empty_names)],
            [('format', format_marker)],
            shared)
        return self.open(a_bzrdir=a_bzrdir, _found=True)

    def open(self, a_bzrdir, _found=False, _override_transport=None):
        """See RepositoryFormat.open().

        :param _override_transport: INTERNAL USE ONLY. Allows opening the
            repository at a slightly different url than normal. I.e. during
            'upgrade'.
        """
        if not _found:
            # The result is not used here; presumably the call is made so
            # that an unrecognised format raises - confirm against
            # RepositoryFormat.find_format.
            RepositoryFormat.find_format(a_bzrdir)
        if _override_transport is None:
            repo_transport = a_bzrdir.get_repository_transport(None)
        else:
            repo_transport = _override_transport
        control_files = lockable_files.LockableFiles(
            repo_transport, 'lock', lockdir.LockDir)
        return self.repository_class(
            _format=self,
            a_bzrdir=a_bzrdir,
            control_files=control_files,
            _commit_builder_class=self._commit_builder_class,
            _serializer=self._serializer)

1937

1938

1939

class RepositoryFormatKnitPack1(RepositoryFormatPack):
    """Pack repository format without subtree support.

    Uses the xml5 serializer.  This format was introduced in 0.92.
    """

    repository_class = KnitPackRepository
    _commit_builder_class = PackCommitBuilder
    _serializer = xml5.serializer_v5

    def _get_matching_bzrdir(self):
        """Return the 'pack-0.92' bzrdir made by the format registry."""
        registry = bzrdir.format_registry
        return registry.make_bzrdir('pack-0.92')

    def _ignore_setting_bzrdir(self, format):
        """Ignore assignments to _matchingbzrdir."""

    _matchingbzrdir = property(_get_matching_bzrdir, _ignore_setting_bzrdir)

    def get_format_string(self):
        """Return the format marker; see RepositoryFormat.get_format_string()."""
        return "Bazaar pack repository format 1 (needs bzr 0.92)\n"

    def get_format_description(self):
        """Describe the format; see RepositoryFormat.get_format_description()."""
        return "Packs containing knits without subtree support"

    def check_conversion_target(self, target_format):
        """Accept every target format: no checks are made."""

1967

1968

1969

class RepositoryFormatKnitPack3(RepositoryFormatPack):
    """Pack repository format with subtree support.

    The xml7 serializer is used so that the format can record:
     - full info about the tree root
     - tree-references

    This format was introduced in 0.92.
    """

    repository_class = KnitPackRepository
    _commit_builder_class = PackRootCommitBuilder
    rich_root_data = True
    supports_tree_reference = True
    _serializer = xml7.serializer_v7

    def _get_matching_bzrdir(self):
        """Return the 'pack-0.92-subtree' bzrdir made by the format registry."""
        registry = bzrdir.format_registry
        return registry.make_bzrdir('pack-0.92-subtree')

    def _ignore_setting_bzrdir(self, format):
        """Ignore assignments to _matchingbzrdir."""

    _matchingbzrdir = property(_get_matching_bzrdir, _ignore_setting_bzrdir)

    def check_conversion_target(self, target_format):
        """Require a target with rich root data and tree references.

        :raises errors.BadConversionTarget: if target_format lacks either.
        """
        if not target_format.rich_root_data:
            raise errors.BadConversionTarget(
                'Does not support rich root data.', target_format)
        # supports_tree_reference may be absent on the target; treat a
        # missing attribute as False.
        nested_ok = getattr(target_format, 'supports_tree_reference', False)
        if not nested_ok:
            raise errors.BadConversionTarget(
                'Does not support nested trees', target_format)

    def get_format_string(self):
        """Return the format marker; see RepositoryFormat.get_format_string()."""
        return ("Bazaar pack repository format 1 with subtree support"
                " (needs bzr 0.92)\n")

    def get_format_description(self):
        """Describe the format; see RepositoryFormat.get_format_description()."""
        return "Packs containing knits with subtree support\n"

2009

2010

2011

class RepositoryFormatKnitPack4(RepositoryFormatPack):
    """Rich-root pack repository format without subtree support.

    The xml6 serializer is used so that the format can record:
     - full info about the tree root

    This format was introduced in 1.0.
    """

    repository_class = KnitPackRepository
    _commit_builder_class = PackRootCommitBuilder
    rich_root_data = True
    supports_tree_reference = False
    _serializer = xml6.serializer_v6

    def _get_matching_bzrdir(self):
        """Return the 'rich-root-pack' bzrdir made by the format registry."""
        registry = bzrdir.format_registry
        return registry.make_bzrdir('rich-root-pack')

    def _ignore_setting_bzrdir(self, format):
        """Ignore assignments to _matchingbzrdir."""

    _matchingbzrdir = property(_get_matching_bzrdir, _ignore_setting_bzrdir)

    def check_conversion_target(self, target_format):
        """Require a target with rich root data.

        :raises errors.BadConversionTarget: if target_format lacks it.
        """
        if target_format.rich_root_data:
            return
        raise errors.BadConversionTarget(
            'Does not support rich root data.', target_format)

    def get_format_string(self):
        """Return the format marker; see RepositoryFormat.get_format_string()."""
        return "Bazaar pack repository format 1 with rich root (needs bzr 1.0)\n"

    def get_format_description(self):
        """Describe the format; see RepositoryFormat.get_format_description()."""
        return "Packs containing knits with rich root support\n"

2048

2049

2050

class RepositoryFormatPackDevelopment0(RepositoryFormatPack):
    """Development repository format without subtree support.

    This format should be retained until the second release after bzr 1.0.

    The disk behaviour is unchanged from pack-0.92.
    """

    repository_class = KnitPackRepository
    _commit_builder_class = PackCommitBuilder
    _serializer = xml5.serializer_v5

    def _get_matching_bzrdir(self):
        """Return the 'development0' bzrdir made by the format registry."""
        registry = bzrdir.format_registry
        return registry.make_bzrdir('development0')

    def _ignore_setting_bzrdir(self, format):
        """Ignore assignments to _matchingbzrdir."""

    _matchingbzrdir = property(_get_matching_bzrdir, _ignore_setting_bzrdir)

    def get_format_string(self):
        """Return the format marker; see RepositoryFormat.get_format_string()."""
        return "Bazaar development format 0 (needs bzr.dev from before 1.3)\n"

    def get_format_description(self):
        """Describe the format; see RepositoryFormat.get_format_description()."""
        return "Development repository format, currently the same as pack-0.92\n"

    def check_conversion_target(self, target_format):
        """Accept every target format: no checks are made."""

2081

2082

2083

class RepositoryFormatPackDevelopment0Subtree(RepositoryFormatPack):
    """Development repository format with subtree support.

    This format should be retained until the second release after bzr 1.0.

    The disk behaviour is unchanged from pack-0.92-subtree.
    """

    repository_class = KnitPackRepository
    _commit_builder_class = PackRootCommitBuilder
    rich_root_data = True
    supports_tree_reference = True
    _serializer = xml7.serializer_v7

    def _get_matching_bzrdir(self):
        """Return the 'development0-subtree' bzrdir made by the registry."""
        registry = bzrdir.format_registry
        return registry.make_bzrdir('development0-subtree')

    def _ignore_setting_bzrdir(self, format):
        """Ignore assignments to _matchingbzrdir."""

    _matchingbzrdir = property(_get_matching_bzrdir, _ignore_setting_bzrdir)

    def check_conversion_target(self, target_format):
        """Require a target with rich root data and tree references.

        :raises errors.BadConversionTarget: if target_format lacks either.
        """
        if not target_format.rich_root_data:
            raise errors.BadConversionTarget(
                'Does not support rich root data.', target_format)
        # supports_tree_reference may be absent on the target; treat a
        # missing attribute as False.
        nested_ok = getattr(target_format, 'supports_tree_reference', False)
        if not nested_ok:
            raise errors.BadConversionTarget(
                'Does not support nested trees', target_format)

    def get_format_string(self):
        """Return the format marker; see RepositoryFormat.get_format_string()."""
        return ("Bazaar development format 0 with subtree support"
                " (needs bzr.dev from before 1.3)\n")

    def get_format_description(self):
        """Describe the format; see RepositoryFormat.get_format_description()."""
        return ("Development repository format, currently the same as"
                " pack-0.92-subtree\n")

2123

2124

Older »