/brz/remove-bazaar : revision 4501.1.1

To get this branch, use:

bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/repository.py

Committer: Robert Collins
Date: 2009-07-02 07:22:27 UTC
mto: This revision was merged to the branch mainline in revision 4505.
Revision ID: robertc@robertcollins.net-20090702072227-a2yzortdrjcnls5c

Add documentation describing how and why we use inventory deltas, and what can go wrong with them.

files added:
bzrlib/textui.py

bzrlib/weave_commands.py

contrib/fortune

doc/bazaar-vcs.org.kid

doc/en/developer-guide

doc/en/user-guide/index.txt

doc/es/guia-desarrollador

doc/es/notas-version

doc/es/referencia

tools/biobench.py

tools/history2revfiles.py

files removed:
.testr.conf

MANIFEST.in

NEWS-template.txt

README_BDIST_RPM

apport

apport/README

apport/bzr-crashdb.conf

apport/source_bzr.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_import_c_api.h

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/cleanup.py

bzrlib/cmdline.py

bzrlib/crash.py

bzrlib/doc_generate/sphinx_conf.py

bzrlib/help_topics/en/location-alias.txt

bzrlib/help_topics/es

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/lp_propose.py

bzrlib/plugins/launchpad/test_lp_api.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/news_merge

bzrlib/plugins/news_merge/README

bzrlib/plugins/news_merge/__init__.py

bzrlib/plugins/news_merge/news_merge.py

bzrlib/plugins/news_merge/parser.py

bzrlib/plugins/news_merge/tests

bzrlib/plugins/news_merge/tests/__init__.py

bzrlib/plugins/news_merge/tests/test_news_merge.py

bzrlib/static_tuple.py

bzrlib/tests/blackbox/test_rmbranch.py

bzrlib/tests/commands/test_revert.py

bzrlib/tests/features.py

bzrlib/tests/matchers.py

bzrlib/tests/per_bzrdir_colo

bzrlib/tests/per_bzrdir_colo/__init__.py

bzrlib/tests/per_bzrdir_colo/test_supported.py

bzrlib/tests/per_bzrdir_colo/test_unsupported.py

bzrlib/tests/per_foreign_vcs

bzrlib/tests/per_foreign_vcs/__init__.py

bzrlib/tests/per_foreign_vcs/test_branch.py

bzrlib/tests/per_foreign_vcs/test_repository.py

bzrlib/tests/per_merger.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_tree/test_locking.py

bzrlib/tests/per_uifactory

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/script.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test_cleanup.py

bzrlib/tests/test_cmdline.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_import_tariff.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_matchers.py

bzrlib/tests/test_patches_data/binary-after-normal.patch

bzrlib/tests/test_patches_data/binary.patch

bzrlib/tests/test_script.py

bzrlib/tests/test_server.py

bzrlib/transport/pathfilter.py

contrib/debian

contrib/debian/default

contrib/debian/init.d

doc/Bazaar-Logo-For-Manuals.png

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr-doc.css

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/apport.txt

doc/developers/check.txt

doc/developers/conf.py

doc/developers/content-filtering.txt

doc/developers/contribution-quickstart.txt

doc/developers/implementation-notes.txt

doc/developers/index-plain.txt

doc/developers/miscellaneous-notes.txt

doc/developers/plans.txt

doc/developers/principles.txt

doc/developers/specifications.txt

doc/developers/win32_build_setup.txt

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide/advanced.txt

doc/en/admin-guide/backup.txt

doc/en/admin-guide/code-browsing.txt

doc/en/admin-guide/hooks-plugins.txt

doc/en/admin-guide/index-plain.txt

doc/en/admin-guide/integration.txt

doc/en/admin-guide/introduction.txt

doc/en/admin-guide/migration.txt

doc/en/admin-guide/other-setups.txt

doc/en/admin-guide/security.txt

doc/en/admin-guide/simple-setups.txt

doc/en/admin-guide/upgrade.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/quick-reference/index.txt

doc/en/tutorials/index.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/whats-new

doc/en/whats-new/whats-new-in-2.1.txt

doc/en/whats-new/whats-new-in-2.2.txt

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/quick-reference/index.txt

doc/es/user-guide/index-plain.txt

doc/index.es.txt

doc/index.ja.txt

doc/index.ru.txt

doc/ja

doc/ja/_static

doc/ja/_static/bzr icon 16.png

doc/ja/_static/bzr.ico

doc/ja/_templates

doc/ja/conf.py

doc/ja/index.txt

doc/ja/mini-tutorial

doc/ja/mini-tutorial/index.txt

doc/ja/tutorials

doc/ja/tutorials/centralized_workflow.txt

doc/ja/tutorials/index.txt

doc/ja/tutorials/tutorial.txt

doc/ja/tutorials/using_bazaar_with_launchpad.txt

doc/ja/upgrade-guide

doc/ja/upgrade-guide/data_migration.txt

doc/ja/upgrade-guide/index.txt

doc/ja/upgrade-guide/overview.txt

doc/ja/upgrade-guide/tips_and_tricks.txt

doc/ja/user-guide

doc/ja/user-guide/adv_merging.txt

doc/ja/user-guide/annotating_changes.txt

doc/ja/user-guide/bazaar_workflows.txt

doc/ja/user-guide/branching_a_project.txt

doc/ja/user-guide/browsing_history.txt

doc/ja/user-guide/bug_trackers.txt

doc/ja/user-guide/bzrtools_plugin.txt

doc/ja/user-guide/central_intro.txt

doc/ja/user-guide/configuring_bazaar.txt

doc/ja/user-guide/controlling_registration.txt

doc/ja/user-guide/core_concepts.txt

doc/ja/user-guide/distributed_intro.txt

doc/ja/user-guide/entering_commands.txt

doc/ja/user-guide/filtered_views.txt

doc/ja/user-guide/getting_help.txt

doc/ja/user-guide/hooks.txt

doc/ja/user-guide/http_smart_server.txt

doc/ja/user-guide/images

doc/ja/user-guide/images/workflows_centralized.png

doc/ja/user-guide/images/workflows_centralized.svg

doc/ja/user-guide/images/workflows_gatekeeper.png

doc/ja/user-guide/images/workflows_gatekeeper.svg

doc/ja/user-guide/images/workflows_localcommit.png

doc/ja/user-guide/images/workflows_localcommit.svg

doc/ja/user-guide/images/workflows_peer.png

doc/ja/user-guide/images/workflows_peer.svg

doc/ja/user-guide/images/workflows_pqm.png

doc/ja/user-guide/images/workflows_pqm.svg

doc/ja/user-guide/images/workflows_shared.png

doc/ja/user-guide/images/workflows_shared.svg

doc/ja/user-guide/images/workflows_single.png

doc/ja/user-guide/images/workflows_single.svg

doc/ja/user-guide/index.txt

doc/ja/user-guide/installing_bazaar.txt

doc/ja/user-guide/introducing_bazaar.txt

doc/ja/user-guide/merging_changes.txt

doc/ja/user-guide/organizing_branches.txt

doc/ja/user-guide/organizing_your_workspace.txt

doc/ja/user-guide/part2_intro.txt

doc/ja/user-guide/partner_intro.txt

doc/ja/user-guide/plugins.txt

doc/ja/user-guide/publishing_a_branch.txt

doc/ja/user-guide/recording_changes.txt

doc/ja/user-guide/releasing_a_project.txt

doc/ja/user-guide/resolving_conflicts.txt

doc/ja/user-guide/reusing_a_checkout.txt

doc/ja/user-guide/reviewing_changes.txt

doc/ja/user-guide/sending_changes.txt

doc/ja/user-guide/server.txt

doc/ja/user-guide/setting_up_email.txt

doc/ja/user-guide/shared_repository_layouts.txt

doc/ja/user-guide/shelving_changes.txt

doc/ja/user-guide/solo_intro.txt

doc/ja/user-guide/specifying_revisions.txt

doc/ja/user-guide/stacked.txt

doc/ja/user-guide/starting_a_project.txt

doc/ja/user-guide/svn_plugin.txt

doc/ja/user-guide/undoing_mistakes.txt

doc/ja/user-guide/using_aliases.txt

doc/ja/user-guide/using_checkouts.txt

doc/ja/user-guide/using_gatekeepers.txt

doc/ja/user-guide/version_info.txt

doc/ja/user-guide/web_browsing.txt

doc/ja/user-guide/working_offline_central.txt

doc/ja/user-guide/writing_a_plugin.txt

doc/ja/user-guide/zen.txt

doc/ja/user-reference

doc/ja/user-reference/index.txt

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/quick-reference/index.txt

doc/ru/user-guide/index-plain.txt

tools/generate_release_notes.py

tools/package_docs.py

tools/packaging/update-control.sh

tools/win32/bootstrap.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

files renamed:
bzrlib/help_topics/en/conflict-types.txt => bzrlib/help_topics/en/conflicts.txt

bzrlib/tests/per_branch/ => bzrlib/tests/branch_implementations/

bzrlib/tests/per_bzrdir/ => bzrlib/tests/bzrdir_implementations/

bzrlib/tests/per_interrepository/ => bzrlib/tests/interrepository_implementations/

bzrlib/tests/per_intertree/ => bzrlib/tests/intertree_implementations/

bzrlib/tests/per_inventory/ => bzrlib/tests/inventory_implementations/

bzrlib/tests/test__bencode.py => bzrlib/tests/test_bencode.py

bzrlib/tests/per_pack_repository.py => bzrlib/tests/test_pack_repository.py

bzrlib/tests/per_transport.py => bzrlib/tests/test_transport_implementations.py

bzrlib/tests/per_versionedfile.py => bzrlib/tests/test_versionedfile.py

bzrlib/tests/per_tree/ => bzrlib/tests/tree_implementations/

bzrlib/tests/per_workingtree/ => bzrlib/tests/workingtree_implementations/

doc/developers/HACKING.txt => doc/en/developer-guide/HACKING.txt

doc/en/_static/en/Makefile => doc/en/quick-reference/Makefile

doc/en/_static/en/bzr-en-quick-reference.pdf => doc/en/quick-reference/quick-start-summary.pdf

doc/en/_static/en/bzr-en-quick-reference.png => doc/en/quick-reference/quick-start-summary.png

doc/en/_static/en/bzr-en-quick-reference.svg => doc/en/quick-reference/quick-start-summary.svg

doc/es/user-guide/ => doc/es/guia-usuario/

bzrlib/help_topics/es/conflict-types.txt => doc/es/guia-usuario/resolving_conflicts.txt

doc/es/quick-reference/ => doc/es/referencia-rapida/

doc/es/_static/es/Makefile => doc/es/referencia-rapida/Makefile

doc/es/_static/es/bzr-es-quick-reference.svg => doc/es/referencia-rapida/referencia-rapida.svg

doc/es/index.txt => doc/index.es.txt

doc/ru/index.txt => doc/index.ru.txt

doc/ru/_static/ru/Makefile => doc/ru/quick-reference/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf => doc/ru/quick-reference/quick-start-summary.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png => doc/ru/quick-reference/quick-start-summary.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg => doc/ru/quick-reference/quick-start-summary.svg

files modified:
.bzrignore

INSTALL

Makefile

NEWS

README

bzrlib/__init__.py

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_groupcompress_pyx.pyx

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/bencode.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/foreign.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_create_clone.py

bzrlib/tests/branch_implementations/test_dotted_revno_to_revision_id.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_iter_merge_sorted_revisions.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_dotted_revno.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/bzrdir_implementations/test_push.py

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_file_with_stat.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_content_filters.py

bzrlib/tests/workingtree_implementations/test_eol_conversion.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_views.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textinv.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/_bencode_py.py

bzrlib/version.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

doc/default.css

doc/developers/add.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bug-handling.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/update.txt

doc/en/admin-guide/index.txt

doc/en/mini-tutorial/index.txt

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial/index.txt

doc/index.txt

doc/ru/mini-tutorial/index.txt

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/zen.txt

profile_imports.py

setup.py

tools/generate_docs.py

tools/packaging/build-packages.sh

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/win32/build_release.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/info.txt

tools/win32/ostools.py

Show diffs side-by-side

added added

removed removed

bzrlib/repository.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

bzrdir,

check,

chk_map,

config,

debug,

errors,

fetch as _mod_fetch,

fifo_cache,

generate_ids,

gpg,

graph,

inventory,

inventory_delta,

lazy_regex,

lockable_files,

lockdir,

lru_cache,

osutils,

revision as _mod_revision,

static_tuple,

symbol_versioning,

trace,

tsort,

ui,

versionedfile,

from bzrlib.testament import Testament

""")

from bzrlib.decorators import needs_read_lock, needs_write_lock, only_raises

from bzrlib.decorators import needs_read_lock, needs_write_lock

from bzrlib.inter import InterObject

from bzrlib.inventory import (

Inventory,

ROOT_ID,

entry_factory,

)

from bzrlib.lock import _RelockDebugMixin

from bzrlib import registry

from bzrlib.symbol_versioning import (

deprecated_method,

)

from bzrlib.trace import (

log_exception_quietly, note, mutter, mutter_callsite, warning)

210

207

# an inventory delta was accumulated without creating a new

211

208

# inventory.

212

209

basis_id = self.basis_delta_revision

213

# We ignore the 'inventory' returned by add_inventory_by_delta

214

# because self.new_inventory is used to hint to the rest of the

215

# system what code path was taken

216

self.inv_sha1, _ = self.repository.add_inventory_by_delta(

210

self.inv_sha1 = self.repository.add_inventory_by_delta(

217

211

basis_id, self._basis_delta, self._new_revision_id,

218

212

self.parents)

219

213

else:

473

467

if content_summary[2] is None:

474

468

raise ValueError("Files must not have executable = None")

475

469

if not store:

476

# We can't trust a check of the file length because of content

477

# filtering...

478

if (# if the exec bit has changed we have to store:

470

if (# if the file length changed we have to store:

471

parent_entry.text_size != content_summary[1] or

472

# if the exec bit has changed we have to store:

479

473

parent_entry.executable != content_summary[2]):

480

474

store = True

481

475

elif parent_entry.text_sha1 == content_summary[3]:

548

542

ie.revision = parent_entry.revision

549

543

return self._get_delta(ie, basis_inv, path), False, None

550

544

ie.reference_revision = content_summary[3]

551

if ie.reference_revision is None:

552

raise AssertionError("invalid content_summary for nested tree: %r"

553

% (content_summary,))

554

545

self._add_text_to_weave(ie.file_id, '', heads, None)

555

546

else:

556

547

raise NotImplementedError('unknown kind')

797

788

# references.

798

789

raise errors.UnsupportedOperation(tree.add_reference,

799

790

self.repository)

800

reference_revision = tree.get_reference_revision(change[0])

801

entry.reference_revision = reference_revision

791

entry.reference_revision = \

792

tree.get_reference_revision(change[0])

802

793

if (carry_over_possible and

803

794

parent_entry.reference_revision == reference_revision):

804

795

carried_over = True

818

809

seen_root = True

819

810

self.new_inventory = None

820

811

if len(inv_delta):

821

# This should perhaps be guarded by a check that the basis we

822

# commit against is the basis for the commit and if not do a delta

823

# against the basis.

824

812

self._any_changes = True

825

813

if not seen_root:

826

814

# housekeeping root entry changes do not affect no-change commits.

860

848

# versioned roots do not change unless the tree found a change.

861

849

862

850

863

class RepositoryWriteLockResult(object):

864

"""The result of write locking a repository.

865

866

:ivar repository_token: The token obtained from the underlying lock, or

867

None.

868

:ivar unlock: A callable which will unlock the lock.

869

"""

870

871

def __init__(self, unlock, repository_token):

872

self.repository_token = repository_token

873

self.unlock = unlock

874

875

876

851

######################################################################

877

852

# Repositories

878

853

879

880

class Repository(_RelockDebugMixin, bzrdir.ControlComponent):

854

class Repository(object):

881

855

"""Repository holding history for one or more branches.

882

856

883

857

The repository holds and retrieves historical information including

952

926

"""

953

927

if self._write_group is not self.get_transaction():

954

928

# has an unlock or relock occurred?

955

if suppress_errors:

956

mutter(

957

'(suppressed) mismatched lock context and write group. %r, %r',

958

self._write_group, self.get_transaction())

959

return

960

929

raise errors.BzrError(

961

930

'mismatched lock context and write group. %r, %r' %

962

931

(self._write_group, self.get_transaction()))

1041

1010

1042

1011

:seealso: add_inventory, for the contract.

1043

1012

"""

1044

inv_lines = self._serializer.write_inventory_to_lines(inv)

1013

inv_lines = self._serialise_inventory_to_lines(inv)

1045

1014

return self._inventory_add_lines(revision_id, parents,

1046

1015

inv_lines, check_content=False)

1047

1016

1096

1065

check_content=True):

1097

1066

"""Store lines in inv_vf and return the sha1 of the inventory."""

1098

1067

parents = [(parent,) for parent in parents]

1099

result = self.inventories.add_lines((revision_id,), parents, lines,

1068

return self.inventories.add_lines((revision_id,), parents, lines,

1100

1069

check_content=check_content)[0]

1101

self.inventories._access.flush()

1102

return result

1103

1070

1104

1071

def add_revision(self, revision_id, rev, inv=None, config=None):

1105

1072

"""Add rev to the revision store as revision_id.

1181

1148

# The old API returned a list, should this actually be a set?

1182

1149

return parent_map.keys()

1183

1150

1184

def _check_inventories(self, checker):

1185

"""Check the inventories found from the revision scan.

1186

1187

This is responsible for verifying the sha1 of inventories and

1188

creating a pending_keys set that covers data referenced by inventories.

1189

"""

1190

bar = ui.ui_factory.nested_progress_bar()

1191

try:

1192

self._do_check_inventories(checker, bar)

1193

finally:

1194

bar.finished()

1195

1196

def _do_check_inventories(self, checker, bar):

1197

"""Helper for _check_inventories."""

1198

revno = 0

1199

keys = {'chk_bytes':set(), 'inventories':set(), 'texts':set()}

1200

kinds = ['chk_bytes', 'texts']

1201

count = len(checker.pending_keys)

1202

bar.update("inventories", 0, 2)

1203

current_keys = checker.pending_keys

1204

checker.pending_keys = {}

1205

# Accumulate current checks.

1206

for key in current_keys:

1207

if key[0] != 'inventories' and key[0] not in kinds:

1208

checker._report_items.append('unknown key type %r' % (key,))

1209

keys[key[0]].add(key[1:])

1210

if keys['inventories']:

1211

# NB: output order *should* be roughly sorted - topo or

1212

# inverse topo depending on repository - either way decent

1213

# to just delta against. However, pre-CHK formats didn't

1214

# try to optimise inventory layout on disk. As such the

1215

# pre-CHK code path does not use inventory deltas.

1216

last_object = None

1217

for record in self.inventories.check(keys=keys['inventories']):

1218

if record.storage_kind == 'absent':

1219

checker._report_items.append(

1220

'Missing inventory {%s}' % (record.key,))

1221

else:

1222

last_object = self._check_record('inventories', record,

1223

checker, last_object,

1224

current_keys[('inventories',) + record.key])

1225

del keys['inventories']

1226

else:

1227

return

1228

bar.update("texts", 1)

1229

while (checker.pending_keys or keys['chk_bytes']

1230

or keys['texts']):

1231

# Something to check.

1232

current_keys = checker.pending_keys

1233

checker.pending_keys = {}

1234

# Accumulate current checks.

1235

for key in current_keys:

1236

if key[0] not in kinds:

1237

checker._report_items.append('unknown key type %r' % (key,))

1238

keys[key[0]].add(key[1:])

1239

# Check the outermost kind only - inventories || chk_bytes || texts

1240

for kind in kinds:

1241

if keys[kind]:

1242

last_object = None

1243

for record in getattr(self, kind).check(keys=keys[kind]):

1244

if record.storage_kind == 'absent':

1245

checker._report_items.append(

1246

'Missing %s {%s}' % (kind, record.key,))

1247

else:

1248

last_object = self._check_record(kind, record,

1249

checker, last_object, current_keys[(kind,) + record.key])

1250

keys[kind] = set()

1251

break

1252

1253

def _check_record(self, kind, record, checker, last_object, item_data):

1254

"""Check a single text from this repository."""

1255

if kind == 'inventories':

1256

rev_id = record.key[0]

1257

inv = self._deserialise_inventory(rev_id,

1258

record.get_bytes_as('fulltext'))

1259

if last_object is not None:

1260

delta = inv._make_delta(last_object)

1261

for old_path, path, file_id, ie in delta:

1262

if ie is None:

1263

continue

1264

ie.check(checker, rev_id, inv)

1265

else:

1266

for path, ie in inv.iter_entries():

1267

ie.check(checker, rev_id, inv)

1268

if self._format.fast_deltas:

1269

return inv

1270

elif kind == 'chk_bytes':

1271

# No code written to check chk_bytes for this repo format.

1272

checker._report_items.append(

1273

'unsupported key type chk_bytes for %s' % (record.key,))

1274

elif kind == 'texts':

1275

self._check_text(record, checker, item_data)

1276

else:

1277

checker._report_items.append(

1278

'unknown key type %s for %s' % (kind, record.key))

1279

1280

def _check_text(self, record, checker, item_data):

1281

"""Check a single text."""

1282

# Check it is extractable.

1283

# TODO: check length.

1284

if record.storage_kind == 'chunked':

1285

chunks = record.get_bytes_as(record.storage_kind)

1286

sha1 = osutils.sha_strings(chunks)

1287

length = sum(map(len, chunks))

1288

else:

1289

content = record.get_bytes_as('fulltext')

1290

sha1 = osutils.sha_string(content)

1291

length = len(content)

1292

if item_data and sha1 != item_data[1]:

1293

checker._report_items.append(

1294

'sha1 mismatch: %s has sha1 %s expected %s referenced by %s' %

1295

(record.key, sha1, item_data[1], item_data[2]))

1296

1297

1151

@staticmethod

1298

1152

def create(a_bzrdir):

1299

1153

"""Construct the current default format repository in a_bzrdir."""

1304

1158

1305

1159

:param _format: The format of the repository on disk.

1306

1160

:param a_bzrdir: The BzrDir of the repository.

1161

1162

In the future we will have a single api for all stores for

1163

getting file texts, inventories and revisions, then

1164

this construct will accept instances of those things.

1307

1165

"""

1308

# In the future we will have a single api for all stores for

1309

# getting file texts, inventories and revisions, then

1310

# this construct will accept instances of those things.

1311

1166

super(Repository, self).__init__()

1312

1167

self._format = _format

1313

1168

# the following are part of the public API for Repository:

1319

1174

self._reconcile_does_inventory_gc = True

1320

1175

self._reconcile_fixes_text_parents = False

1321

1176

self._reconcile_backsup_inventory = True

1177

# not right yet - should be more semantically clear ?

1178

1179

# TODO: make sure to construct the right store classes, etc, depending

1180

# on whether escaping is required.

1181

self._warn_if_deprecated()

1322

1182

self._write_group = None

1323

1183

# Additional places to query for data.

1324

1184

self._fallback_repositories = []

1325

1185

# An InventoryEntry cache, used during deserialization

1326

1186

self._inventory_entry_cache = fifo_cache.FIFOCache(10*1024)

1327

# Is it safe to return inventory entries directly from the entry cache,

1328

# rather than copying them?

1329

self._safe_to_return_from_cache = False

1330

1331

@property

1332

def user_transport(self):

1333

return self.bzrdir.user_transport

1334

1335

@property

1336

def control_transport(self):

1337

return self._transport

1338

1187

1339

1188

def __repr__(self):

1340

if self._fallback_repositories:

1341

return '%s(%r, fallback_repositories=%r)' % (

1342

self.__class__.__name__,

1343

self.base,

1344

self._fallback_repositories)

1345

else:

1346

return '%s(%r)' % (self.__class__.__name__,

1347

self.base)

1348

1349

def _has_same_fallbacks(self, other_repo):

1350

"""Returns true if the repositories have the same fallbacks."""

1351

my_fb = self._fallback_repositories

1352

other_fb = other_repo._fallback_repositories

1353

if len(my_fb) != len(other_fb):

1354

return False

1355

for f, g in zip(my_fb, other_fb):

1356

if not f.has_same_location(g):

1357

return False

1358

return True

1189

return '%s(%r)' % (self.__class__.__name__,

1190

self.base)

1359

1191

1360

1192

def has_same_location(self, other):

1361

1193

"""Returns a boolean indicating if this repository is at the same

1389

1221

data during reads, and allows a 'write_group' to be obtained. Write

1390

1222

groups must be used for actual data insertion.

1391

1223

1392

A token should be passed in if you know that you have locked the object

1393

some other way, and need to synchronise this object's state with that

1394

fact.

1395

1396

XXX: this docstring is duplicated in many places, e.g. lockable_files.py

1397

1398

1224

:param token: if this is already locked, then lock_write will fail

1399

1225

unless the token matches the existing lock.

1400

1226

:returns: a token if this instance supports tokens, otherwise None.

1403

1229

:raises MismatchedToken: if the specified token doesn't match the token

1404

1230

of the existing lock.

1405

1231

:seealso: start_write_group.

1406

:return: A RepositoryWriteLockResult.

1232

1233

A token should be passed in if you know that you have locked the object

1234

some other way, and need to synchronise this object's state with that

1235

fact.

1236

1237

XXX: this docstring is duplicated in many places, e.g. lockable_files.py

1407

1238

"""

1408

1239

locked = self.is_locked()

1409

token = self.control_files.lock_write(token=token)

1240

result = self.control_files.lock_write(token=token)

1410

1241

if not locked:

1411

self._warn_if_deprecated()

1412

self._note_lock('w')

1413

1242

for repo in self._fallback_repositories:

1414

1243

# Writes don't affect fallback repos

1415

1244

repo.lock_read()

1416

1245

self._refresh_data()

1417

return RepositoryWriteLockResult(self.unlock, token)

1246

return result

1418

1247

1419

1248

def lock_read(self):

1420

"""Lock the repository for read operations.

1421

1422

:return: An object with an unlock method which will release the lock

1423

obtained.

1424

"""

1425

1249

locked = self.is_locked()

1426

1250

self.control_files.lock_read()

1427

1251

if not locked:

1428

self._warn_if_deprecated()

1429

self._note_lock('r')

1430

1252

for repo in self._fallback_repositories:

1431

1253

repo.lock_read()

1432

1254

self._refresh_data()

1433

return self

1434

1255

1435

1256

def get_physical_lock_status(self):

1436

1257

return self.control_files.get_physical_lock_status()

1496

1317

1497

1318

# now gather global repository information

1498

1319

# XXX: This is available for many repos regardless of listability.

1499

if self.user_transport.listable():

1320

if self.bzrdir.root_transport.listable():

1500

1321

# XXX: do we want to define __len__() ?

1501

1322

# Maybe the versionedfiles object should provide a different

1502

1323

# method to get the number of keys.

1512

1333

:param using: If True, list only branches using this repository.

1513

1334

"""

1514

1335

if using and not self.is_shared():

1515

return self.bzrdir.list_branches()

1336

try:

1337

return [self.bzrdir.open_branch()]

1338

except errors.NotBranchError:

1339

return []

1516

1340

class Evaluator(object):

1517

1341

1518

1342

def __init__(self):

1527

1351

except errors.NoRepositoryPresent:

1528

1352

pass

1529

1353

else:

1530

return False, ([], repository)

1354

return False, (None, repository)

1531

1355

self.first_call = False

1532

value = (bzrdir.list_branches(), None)

1356

try:

1357

value = (bzrdir.open_branch(), None)

1358

except errors.NotBranchError:

1359

value = (None, None)

1533

1360

return True, value

1534

1361

1535

ret = []

1536

for branches, repository in bzrdir.BzrDir.find_bzrdirs(

1537

self.user_transport, evaluate=Evaluator()):

1538

if branches is not None:

1539

ret.extend(branches)

1362

branches = []

1363

for branch, repository in bzrdir.BzrDir.find_bzrdirs(

1364

self.bzrdir.root_transport, evaluate=Evaluator()):

1365

if branch is not None:

1366

branches.append(branch)

1540

1367

if not using and repository is not None:

1541

ret.extend(repository.find_branches())

1542

return ret

1368

branches.extend(repository.find_branches())

1369

return branches

1543

1370

1544

1371

@needs_read_lock

1545

1372

def search_missing_revision_ids(self, other, revision_id=None, find_ghosts=True):

1574

1401

"""Commit the contents accrued within the current write group.

1575

1402

1576

1403

:seealso: start_write_group.

1577

1578

:return: it may return an opaque hint that can be passed to 'pack'.

1579

1404

"""

1580

1405

if self._write_group is not self.get_transaction():

1581

1406

# has an unlock or relock occurred?

1635

1460

# but at the moment we're only checking for texts referenced by

1636

1461

# inventories at the graph's edge.

1637

1462

key_deps = self.revisions._index._key_dependencies

1638

key_deps.satisfy_refs_for_keys(present_inventories)

1463

key_deps.add_keys(present_inventories)

1639

1464

referrers = frozenset(r[0] for r in key_deps.get_referrers())

1640

1465

file_ids = self.fileids_altered_by_revision_ids(referrers)

1641

1466

missing_texts = set()

1707

1532

raise errors.InternalBzrError(

1708

1533

"May not fetch while in a write group.")

1709

1534

# fast path same-url fetch operations

1710

# TODO: lift out to somewhere common with RemoteRepository

1711

# <https://bugs.edge.launchpad.net/bzr/+bug/401646>

1712

if (self.has_same_location(source)

1713

and fetch_spec is None

1714

and self._has_same_fallbacks(source)):

1535

if self.has_same_location(source) and fetch_spec is None:

1715

1536

# check that last_revision is in 'from' and then return a

1716

1537

# no-operation.

1717

1538

if (revision_id is not None and

1742

1563

:param revprops: Optional dictionary of revision properties.

1743

1564

:param revision_id: Optional revision id.

1744

1565

"""

1745

if self._fallback_repositories:

1746

raise errors.BzrError("Cannot commit from a lightweight checkout "

1747

"to a stacked branch. See "

1748

"https://bugs.launchpad.net/bzr/+bug/375013 for details.")

1749

1566

result = self._commit_builder_class(self, parents, config,

1750

1567

timestamp, timezone, committer, revprops, revision_id)

1751

1568

self.start_write_group()

1752

1569

return result

1753

1570

1754

@only_raises(errors.LockNotHeld, errors.LockBroken)

1755

1571

def unlock(self):

1756

1572

if (self.control_files._lock_count == 1 and

1757

1573

self.control_files._lock_mode == 'w'):

1879

1695

1880

1696

@needs_read_lock

1881

1697

def get_revisions(self, revision_ids):

1882

"""Get many revisions at once.

1883

1884

Repositories that need to check data on every revision read should

1885

subclass this method.

1886

"""

1698

"""Get many revisions at once."""

1887

1699

return self._get_revisions(revision_ids)

1888

1700

1889

1701

@needs_read_lock

1890

1702

def _get_revisions(self, revision_ids):

1891

1703

"""Core work logic to get many revisions without sanity checks."""

1704

for rev_id in revision_ids:

1705

if not rev_id or not isinstance(rev_id, basestring):

1706

raise errors.InvalidRevisionId(revision_id=rev_id, branch=self)

1707

keys = [(key,) for key in revision_ids]

1708

stream = self.revisions.get_record_stream(keys, 'unordered', True)

1892

1709

revs = {}

1893

for revid, rev in self._iter_revisions(revision_ids):

1894

if rev is None:

1895

raise errors.NoSuchRevision(self, revid)

1896

revs[revid] = rev

1710

for record in stream:

1711

if record.storage_kind == 'absent':

1712

raise errors.NoSuchRevision(self, record.key[0])

1713

text = record.get_bytes_as('fulltext')

1714

rev = self._serializer.read_revision_from_string(text)

1715

revs[record.key[0]] = rev

1897

1716

return [revs[revid] for revid in revision_ids]

1898

1717

1899

def _iter_revisions(self, revision_ids):

1900

"""Iterate over revision objects.

1901

1902

:param revision_ids: An iterable of revisions to examine. None may be

1903

passed to request all revisions known to the repository. Note that

1904

not all repositories can find unreferenced revisions; for those

1905

repositories only referenced ones will be returned.

1906

:return: An iterator of (revid, revision) tuples. Absent revisions (

1907

those asked for but not available) are returned as (revid, None).

1908

"""

1909

if revision_ids is None:

1910

revision_ids = self.all_revision_ids()

1911

else:

1912

for rev_id in revision_ids:

1913

if not rev_id or not isinstance(rev_id, basestring):

1914

raise errors.InvalidRevisionId(revision_id=rev_id, branch=self)

1915

keys = [(key,) for key in revision_ids]

1916

stream = self.revisions.get_record_stream(keys, 'unordered', True)

1917

for record in stream:

1918

revid = record.key[0]

1919

if record.storage_kind == 'absent':

1920

yield (revid, None)

1921

else:

1922

text = record.get_bytes_as('fulltext')

1923

rev = self._serializer.read_revision_from_string(text)

1924

yield (revid, rev)

1718

@needs_read_lock

1719

def get_revision_xml(self, revision_id):

1720

# TODO: jam 20070210 This shouldn't be necessary since get_revision

1721

# would have already done it.

1722

# TODO: jam 20070210 Just use _serializer.write_revision_to_string()

1723

# TODO: this can't just be replaced by:

1724

# return self._serializer.write_revision_to_string(

1725

# self.get_revision(revision_id))

1726

# as cStringIO preserves the encoding unlike write_revision_to_string

1727

# or some other call down the path.

1728

rev = self.get_revision(revision_id)

1729

rev_tmp = cStringIO.StringIO()

1730

# the current serializer..

1731

self._serializer.write_revision(rev, rev_tmp)

1732

rev_tmp.seek(0)

1733

return rev_tmp.getvalue()

1925

1734

1926

1735

def get_deltas_for_revisions(self, revisions, specific_fileids=None):

1927

1736

"""Produce a generator of revision deltas.

2170

1979

"""

2171

1980

selected_keys = set((revid,) for revid in revision_ids)

2172

1981

w = _inv_weave or self.inventories

2173

return self._find_file_ids_from_xml_inventory_lines(

2174

w.iter_lines_added_or_present_in_keys(

2175

selected_keys, pb=None),

2176

selected_keys)

1982

pb = ui.ui_factory.nested_progress_bar()

1983

try:

1984

return self._find_file_ids_from_xml_inventory_lines(

1985

w.iter_lines_added_or_present_in_keys(

1986

selected_keys, pb=pb),

1987

selected_keys)

1988

finally:

1989

pb.finished()

2177

1990

2178

1991

def iter_files_bytes(self, desired_files):

2179

1992

"""Iterate through file versions.

2261

2074

batch_size]

2262

2075

if not to_query:

2263

2076

break

2264

for revision_id in to_query:

2077

for rev_tree in self.revision_trees(to_query):

2078

revision_id = rev_tree.get_revision_id()

2265

2079

parent_ids = ancestors[revision_id]

2266

2080

for text_key in revision_keys[revision_id]:

2267

2081

pb.update("Calculating text parents", processed_texts)

2340

2154

num_file_ids = len(file_ids)

2341

2155

for file_id, altered_versions in file_ids.iteritems():

2342

2156

if pb is not None:

2343

pb.update("Fetch texts", count, num_file_ids)

2157

pb.update("fetch texts", count, num_file_ids)

2344

2158

count += 1

2345

2159

yield ("file", file_id, altered_versions)

2346

2160

2367

2181

"""Get Inventory object by revision id."""

2368

2182

return self.iter_inventories([revision_id]).next()

2369

2183

2370

def iter_inventories(self, revision_ids, ordering=None):

2184

def iter_inventories(self, revision_ids):

2371

2185

"""Get many inventories by revision_ids.

2372

2186

2373

2187

This will buffer some or all of the texts used in constructing the

2375

2189

time.

2376

2190

2377

2191

:param revision_ids: The expected revision ids of the inventories.

2378

:param ordering: optional ordering, e.g. 'topological'. If not

2379

specified, the order of revision_ids will be preserved (by

2380

buffering if necessary).

2381

2192

:return: An iterator of inventories.

2382

2193

"""

2383

2194

if ((None in revision_ids)

2384

2195

or (_mod_revision.NULL_REVISION in revision_ids)):

2385

2196

raise ValueError('cannot get null revision inventory')

2386

return self._iter_inventories(revision_ids, ordering)

2197

return self._iter_inventories(revision_ids)

2387

2198

2388

def _iter_inventories(self, revision_ids, ordering):

2199

def _iter_inventories(self, revision_ids):

2389

2200

"""single-document based inventory iteration."""

2390

inv_xmls = self._iter_inventory_xmls(revision_ids, ordering)

2391

for text, revision_id in inv_xmls:

2392

yield self._deserialise_inventory(revision_id, text)

2201

for text, revision_id in self._iter_inventory_xmls(revision_ids):

2202

yield self.deserialise_inventory(revision_id, text)

2393

2203

2394

def _iter_inventory_xmls(self, revision_ids, ordering):

2395

if ordering is None:

2396

order_as_requested = True

2397

ordering = 'unordered'

2398

else:

2399

order_as_requested = False

2204

def _iter_inventory_xmls(self, revision_ids):

2400

2205

keys = [(revision_id,) for revision_id in revision_ids]

2401

if not keys:

2402

return

2403

if order_as_requested:

2404

key_iter = iter(keys)

2405

next_key = key_iter.next()

2406

stream = self.inventories.get_record_stream(keys, ordering, True)

2206

stream = self.inventories.get_record_stream(keys, 'unordered', True)

2407

2207

text_chunks = {}

2408

2208

for record in stream:

2409

2209

if record.storage_kind != 'absent':

2410

chunks = record.get_bytes_as('chunked')

2411

if order_as_requested:

2412

text_chunks[record.key] = chunks

2413

else:

2414

yield ''.join(chunks), record.key[-1]

2210

text_chunks[record.key] = record.get_bytes_as('chunked')

2415

2211

else:

2416

2212

raise errors.NoSuchRevision(self, record.key)

2417

if order_as_requested:

2418

# Yield as many results as we can while preserving order.

2419

while next_key in text_chunks:

2420

chunks = text_chunks.pop(next_key)

2421

yield ''.join(chunks), next_key[-1]

2422

try:

2423

next_key = key_iter.next()

2424

except StopIteration:

2425

# We still want to fully consume the get_record_stream,

2426

# just in case it is not actually finished at this point

2427

next_key = None

2428

break

2213

for key in keys:

2214

chunks = text_chunks.pop(key)

2215

yield ''.join(chunks), key[-1]

2429

2216

2430

def _deserialise_inventory(self, revision_id, xml):

2217

def deserialise_inventory(self, revision_id, xml):

2431

2218

"""Transform the xml into an inventory object.

2432

2219

2433

2220

:param revision_id: The expected revision id of the inventory.

2434

2221

:param xml: A serialised inventory.

2435

2222

"""

2436

2223

result = self._serializer.read_inventory_from_string(xml, revision_id,

2437

entry_cache=self._inventory_entry_cache,

2438

return_from_cache=self._safe_to_return_from_cache)

2224

entry_cache=self._inventory_entry_cache)

2439

2225

if result.revision_id != revision_id:

2440

2226

raise AssertionError('revision id mismatch %s != %s' % (

2441

2227

result.revision_id, revision_id))

2442

2228

return result

2443

2229

2230

def serialise_inventory(self, inv):

2231

return self._serializer.write_inventory_to_string(inv)

2232

2233

def _serialise_inventory_to_lines(self, inv):

2234

return self._serializer.write_inventory_to_lines(inv)

2235

2444

2236

def get_serializer_format(self):

2445

2237

return self._serializer.format_num

2446

2238

2447

2239

@needs_read_lock

2448

def _get_inventory_xml(self, revision_id):

2449

"""Get serialized inventory as a string."""

2450

texts = self._iter_inventory_xmls([revision_id], 'unordered')

2240

def get_inventory_xml(self, revision_id):

2241

"""Get inventory XML as a file object."""

2242

texts = self._iter_inventory_xmls([revision_id])

2451

2243

try:

2452

2244

text, revision_id = texts.next()

2453

2245

except StopIteration:

2454

2246

raise errors.HistoryMissing(self, 'inventory', revision_id)

2455

2247

return text

2456

2248

2249

@needs_read_lock

2250

def get_inventory_sha1(self, revision_id):

2251

"""Return the sha1 hash of the inventory entry

2252

"""

2253

return self.get_revision(revision_id).inventory_sha1

2254

2457

2255

def get_rev_id_for_revno(self, revno, known_pair):

2458

2256

"""Return the revision id of a revno, given a later (revno, revid)

2459

2257

pair in the same history.

2510

2308

else:

2511

2309

next_id = parents[0]

2512

2310

2311

@needs_read_lock

2312

def get_revision_inventory(self, revision_id):

2313

"""Return inventory of a past revision."""

2314

# TODO: Unify this with get_inventory()

2315

# bzr 0.0.6 and later imposes the constraint that the inventory_id

2316

# must be the same as its revision, so this is trivial.

2317

if revision_id is None:

2318

# This does not make sense: if there is no revision,

2319

# then it is the current tree inventory surely ?!

2320

# and thus get_root_id() is something that looks at the last

2321

# commit on the branch, and the get_root_id is an inventory check.

2322

raise NotImplementedError

2323

# return Inventory(self.get_root_id())

2324

else:

2325

return self.get_inventory(revision_id)

2326

2513

2327

def is_shared(self):

2514

2328

"""Return True if this repository is flagged as a shared repository."""

2515

2329

raise NotImplementedError(self.is_shared)

2549

2363

return RevisionTree(self, Inventory(root_id=None),

2550

2364

_mod_revision.NULL_REVISION)

2551

2365

else:

2552

inv = self.get_inventory(revision_id)

2366

inv = self.get_revision_inventory(revision_id)

2553

2367

return RevisionTree(self, inv, revision_id)

2554

2368

2555

2369

def revision_trees(self, revision_ids):

2608

2422

keys = tsort.topo_sort(parent_map)

2609

2423

return [None] + list(keys)

2610

2424

2611

def pack(self, hint=None, clean_obsolete_packs=False):

2425

def pack(self, hint=None):

2612

2426

"""Compress the data within the repository.

2613

2427

2614

2428

This operation only makes sense for some repository types. For other

2624

2438

obtained from the result of commit_write_group(). Out of

2625

2439

date hints are simply ignored, because concurrent operations

2626

2440

can obsolete them rapidly.

2627

2628

:param clean_obsolete_packs: Clean obsolete packs immediately after

2629

the pack operation.

2630

2441

"""

2631

2442

2632

2443

def get_transaction(self):

2648

2459

for ((revision_id,), parent_keys) in \

2649

2460

self.revisions.get_parent_map(query_keys).iteritems():

2650

2461

if parent_keys:

2651

result[revision_id] = tuple([parent_revid

2652

for (parent_revid,) in parent_keys])

2462

result[revision_id] = tuple(parent_revid

2463

for (parent_revid,) in parent_keys)

2653

2464

else:

2654

2465

result[revision_id] = (_mod_revision.NULL_REVISION,)

2655

2466

return result

2657

2468

def _make_parents_provider(self):

2658

2469

return self

2659

2470

2660

@needs_read_lock

2661

def get_known_graph_ancestry(self, revision_ids):

2662

"""Return the known graph for a set of revision ids and their ancestors.

2663

"""

2664

st = static_tuple.StaticTuple

2665

revision_keys = [st(r_id).intern() for r_id in revision_ids]

2666

known_graph = self.revisions.get_known_graph_ancestry(revision_keys)

2667

return graph.GraphThunkIdsToKeys(known_graph)

2668

2669

2471

def get_graph(self, other_repository=None):

2670

2472

"""Return the graph walker for this repository format"""

2671

2473

parents_provider = self._make_parents_provider()

2675

2477

[parents_provider, other_repository._make_parents_provider()])

2676

2478

return graph.Graph(parents_provider)

2677

2479

2678

def _get_versioned_file_checker(self, text_key_references=None,

2679

ancestors=None):

2480

def _get_versioned_file_checker(self, text_key_references=None):

2680

2481

"""Return an object suitable for checking versioned files.

2681

2482

2682

2483

:param text_key_references: if non-None, an already built

2684

2485

to whether they were referred to by the inventory of the

2685

2486

revision_id that they contain. If None, this will be

2686

2487

calculated.

2687

:param ancestors: Optional result from

2688

self.get_graph().get_parent_map(self.all_revision_ids()) if already

2689

available.

2690

2488

"""

2691

2489

return _VersionedFileChecker(self,

2692

text_key_references=text_key_references, ancestors=ancestors)

2490

text_key_references=text_key_references)

2693

2491

2694

2492

def revision_ids_to_search_result(self, result_set):

2695

2493

"""Convert a set of revision ids to a graph SearchResult."""

2745

2543

return record.get_bytes_as('fulltext')

2746

2544

2747

2545

@needs_read_lock

2748

def check(self, revision_ids=None, callback_refs=None, check_repo=True):

2546

def check(self, revision_ids=None):

2749

2547

"""Check consistency of all history of given revision_ids.

2750

2548

2751

2549

Different repository implementations should override _check().

2752

2550

2753

2551

:param revision_ids: A non-empty list of revision_ids whose ancestry

2754

2552

will be checked. Typically the last revision_id of a branch.

2755

:param callback_refs: A dict of check-refs to resolve and callback

2756

the check/_check method on the items listed as wanting the ref.

2757

see bzrlib.check.

2758

:param check_repo: If False do not check the repository contents, just

2759

calculate the data callback_refs requires and call them back.

2760

2553

"""

2761

return self._check(revision_ids, callback_refs=callback_refs,

2762

check_repo=check_repo)

2554

return self._check(revision_ids)

2763

2555

2764

def _check(self, revision_ids, callback_refs, check_repo):

2765

result = check.Check(self, check_repo=check_repo)

2766

result.check(callback_refs)

2556

def _check(self, revision_ids):

2557

result = check.Check(self)

2558

result.check()

2767

2559

return result

2768

2560

2769

def _warn_if_deprecated(self, branch=None):

2561

def _warn_if_deprecated(self):

2770

2562

global _deprecation_warning_done

2771

2563

if _deprecation_warning_done:

2772

2564

return

2773

try:

2774

if branch is None:

2775

conf = config.GlobalConfig()

2776

else:

2777

conf = branch.get_config()

2778

if conf.suppress_warning('format_deprecation'):

2779

return

2780

warning("Format %s for %s is deprecated -"

2781

" please use 'bzr upgrade' to get better performance"

2782

% (self._format, self.bzrdir.transport.base))

2783

finally:

2784

_deprecation_warning_done = True

2565

_deprecation_warning_done = True

2566

warning("Format %s for %s is deprecated - please use 'bzr upgrade' to get better performance"

2567

% (self._format, self.bzrdir.transport.base))

2785

2568

2786

2569

def supports_rich_root(self):

2787

2570

return self._format.rich_root_data

3068

2851

# help), and for fetching when data won't have come from the same

3069

2852

# compressor.

3070

2853

pack_compresses = False

3071

# Does the repository inventory storage understand references to trees?

3072

supports_tree_reference = None

3073

# Is the format experimental ?

3074

experimental = False

3075

2854

3076

def __repr__(self):

3077

return "%s()" % self.__class__.__name__

2855

def __str__(self):

2856

return "<%s>" % self.__class__.__name__

3078

2857

3079

2858

def __eq__(self, other):

3080

2859

# format objects are generally stateless

3093

2872

"""

3094

2873

try:

3095

2874

transport = a_bzrdir.get_repository_transport(None)

3096

format_string = transport.get_bytes("format")

2875

format_string = transport.get("format").read()

3097

2876

return format_registry.get(format_string)

3098

2877

except errors.NoSuchFile:

3099

2878

raise errors.NoRepositoryPresent(a_bzrdir)

3181

2960

raise NotImplementedError(self.network_name)

3182

2961

3183

2962

def check_conversion_target(self, target_format):

3184

if self.rich_root_data and not target_format.rich_root_data:

3185

raise errors.BadConversionTarget(

3186

'Does not support rich root data.', target_format,

3187

from_format=self)

3188

if (self.supports_tree_reference and

3189

not getattr(target_format, 'supports_tree_reference', False)):

3190

raise errors.BadConversionTarget(

3191

'Does not support nested trees', target_format,

3192

from_format=self)

2963

raise NotImplementedError(self.check_conversion_target)

3193

2964

3194

2965

def open(self, a_bzrdir, _found=False):

3195

2966

"""Return an instance of this format for the bzrdir a_bzrdir.

3198

2969

"""

3199

2970

raise NotImplementedError(self.open)

3200

2971

3201

def _run_post_repo_init_hooks(self, repository, a_bzrdir, shared):

3202

from bzrlib.bzrdir import BzrDir, RepoInitHookParams

3203

hooks = BzrDir.hooks['post_repo_init']

3204

if not hooks:

3205

return

3206

params = RepoInitHookParams(repository, self, a_bzrdir, shared)

3207

for hook in hooks:

3208

hook(params)

3209

3210

2972

3211

2973

class MetaDirRepositoryFormat(RepositoryFormat):

3212

2974

"""Common base class for the new repositories using the metadir layout."""

3417

3179

3418

3180

:param revision_id: if None all content is copied, if NULL_REVISION no

3419

3181

content is copied.

3420

:param pb: ignored.

3182

:param pb: optional progress bar to use for progress reports. If not

3183

provided a default one will be created.

3421

3184

:return: None.

3422

3185

"""

3423

ui.ui_factory.warn_experimental_format_fetch(self)

3424

3186

from bzrlib.fetch import RepoFetcher

3425

# See <https://launchpad.net/bugs/456077> asking for a warning here

3426

if self.source._format.network_name() != self.target._format.network_name():

3427

ui.ui_factory.show_user_warning('cross_format_fetch',

3428

from_format=self.source._format,

3429

to_format=self.target._format)

3430

3187

f = RepoFetcher(to_repository=self.target,

3431

3188

from_repository=self.source,

3432

3189

last_revision=revision_id,

3433

3190

fetch_spec=fetch_spec,

3434

find_ghosts=find_ghosts)

3191

pb=pb, find_ghosts=find_ghosts)

3435

3192

3436

3193

def _walk_to_common_revisions(self, revision_ids):

3437

3194

"""Walk out from revision_ids in source to revisions target has.

3606

3363

self.target.texts.insert_record_stream(

3607

3364

self.source.texts.get_record_stream(

3608

3365

self.source.texts.keys(), 'topological', False))

3609

pb.update('Copying inventory', 0, 1)

3366

pb.update('copying inventory', 0, 1)

3610

3367

self.target.inventories.insert_record_stream(

3611

3368

self.source.inventories.get_record_stream(

3612

3369

self.source.inventories.keys(), 'topological', False))

3738

3495

# This is redundant with format.check_conversion_target(), however that

3739

3496

# raises an exception, and we just want to say "False" as in we won't

3740

3497

# support converting between these formats.

3741

if 'IDS_never' in debug.debug_flags:

3742

return False

3743

3498

if source.supports_rich_root() and not target.supports_rich_root():

3744

3499

return False

3745

3500

if (source._format.supports_tree_reference

3746

3501

and not target._format.supports_tree_reference):

3747

3502

return False

3748

if target._fallback_repositories and target._format.supports_chks:

3749

# IDS doesn't know how to copy CHKs for the parent inventories it

3750

# adds to stacked repos.

3751

return False

3752

if 'IDS_always' in debug.debug_flags:

3753

return True

3754

# Only use this code path for local source and target. IDS does far

3755

# too much IO (both bandwidth and roundtrips) over a network.

3756

if not source.bzrdir.transport.base.startswith('file:///'):

3757

return False

3758

if not target.bzrdir.transport.base.startswith('file:///'):

3759

return False

3760

3503

return True

3761

3504

3762

def _get_trees(self, revision_ids, cache):

3763

possible_trees = []

3764

for rev_id in revision_ids:

3765

if rev_id in cache:

3766

possible_trees.append((rev_id, cache[rev_id]))

3767

else:

3768

# Not cached, but inventory might be present anyway.

3769

try:

3770

tree = self.source.revision_tree(rev_id)

3771

except errors.NoSuchRevision:

3772

# Nope, parent is ghost.

3773

pass

3774

else:

3775

cache[rev_id] = tree

3776

possible_trees.append((rev_id, tree))

3777

return possible_trees

3778

3779

def _get_delta_for_revision(self, tree, parent_ids, possible_trees):

3505

def _get_delta_for_revision(self, tree, parent_ids, basis_id, cache):

3780

3506

"""Get the best delta and base for this revision.

3781

3507

3782

3508

:return: (basis_id, delta)

3783

3509

"""

3510

possible_trees = [(parent_id, cache[parent_id])

3511

for parent_id in parent_ids

3512

if parent_id in cache]

3513

if len(possible_trees) == 0:

3514

# There either aren't any parents, or the parents aren't in the

3515

# cache, so just use the last converted tree

3516

possible_trees.append((basis_id, cache[basis_id]))

3784

3517

deltas = []

3785

# Generate deltas against each tree, to find the shortest.

3786

texts_possibly_new_in_tree = set()

3787

3518

for basis_id, basis_tree in possible_trees:

3788

3519

delta = tree.inventory._make_delta(basis_tree.inventory)

3789

for old_path, new_path, file_id, new_entry in delta:

3790

if new_path is None:

3791

# This file_id isn't present in the new rev, so we don't

3792

# care about it.

3793

continue

3794

if not new_path:

3795

# Rich roots are handled elsewhere...

3796

continue

3797

kind = new_entry.kind

3798

if kind != 'directory' and kind != 'file':

3799

# No text record associated with this inventory entry.

3800

continue

3801

# This is a directory or file that has changed somehow.

3802

texts_possibly_new_in_tree.add((file_id, new_entry.revision))

3803

3520

deltas.append((len(delta), basis_id, delta))

3804

3521

deltas.sort()

3805

3522

return deltas[0][1:]

3806

3523

3807

def _fetch_parent_invs_for_stacking(self, parent_map, cache):

3808

"""Find all parent revisions that are absent, but for which the

3809

inventory is present, and copy those inventories.

3810

3811

This is necessary to preserve correctness when the source is stacked

3812

without fallbacks configured. (Note that in cases like upgrade the

3813

source may be not have _fallback_repositories even though it is

3814

stacked.)

3815

"""

3816

parent_revs = set()

3817

for parents in parent_map.values():

3818

parent_revs.update(parents)

3819

present_parents = self.source.get_parent_map(parent_revs)

3820

absent_parents = set(parent_revs).difference(present_parents)

3821

parent_invs_keys_for_stacking = self.source.inventories.get_parent_map(

3822

(rev_id,) for rev_id in absent_parents)

3823

parent_inv_ids = [key[-1] for key in parent_invs_keys_for_stacking]

3824

for parent_tree in self.source.revision_trees(parent_inv_ids):

3825

current_revision_id = parent_tree.get_revision_id()

3826

parents_parents_keys = parent_invs_keys_for_stacking[

3827

(current_revision_id,)]

3828

parents_parents = [key[-1] for key in parents_parents_keys]

3829

basis_id = _mod_revision.NULL_REVISION

3830

basis_tree = self.source.revision_tree(basis_id)

3831

delta = parent_tree.inventory._make_delta(basis_tree.inventory)

3832

self.target.add_inventory_by_delta(

3833

basis_id, delta, current_revision_id, parents_parents)

3834

cache[current_revision_id] = parent_tree

3835

3836

def _fetch_batch(self, revision_ids, basis_id, cache, a_graph=None):

3524

def _get_parent_keys(self, root_key, parent_map):

3525

"""Get the parent keys for a given root id."""

3526

root_id, rev_id = root_key

3527

# Include direct parents of the revision, but only if they used

3528

# the same root_id and are heads.

3529

parent_keys = []

3530

for parent_id in parent_map[rev_id]:

3531

if parent_id == _mod_revision.NULL_REVISION:

3532

continue

3533

if parent_id not in self._revision_id_to_root_id:

3534

# We probably didn't read this revision, go spend the

3535

# extra effort to actually check

3536

try:

3537

tree = self.source.revision_tree(parent_id)

3538

except errors.NoSuchRevision:

3539

# Ghost, fill out _revision_id_to_root_id in case we

3540

# encounter this again.

3541

# But set parent_root_id to None since we don't really know

3542

parent_root_id = None

3543

else:

3544

parent_root_id = tree.get_root_id()

3545

self._revision_id_to_root_id[parent_id] = None

3546

else:

3547

parent_root_id = self._revision_id_to_root_id[parent_id]

3548

if root_id == parent_root_id:

3549

# With stacking we _might_ want to refer to a non-local

3550

# revision, but this code path only applies when we have the

3551

# full content available, so ghosts really are ghosts, not just

3552

# the edge of local data.

3553

parent_keys.append((parent_id,))

3554

else:

3555

# root_id may be in the parent anyway.

3556

try:

3557

tree = self.source.revision_tree(parent_id)

3558

except errors.NoSuchRevision:

3559

# ghost, can't refer to it.

3560

pass

3561

else:

3562

try:

3563

parent_keys.append((tree.inventory[root_id].revision,))

3564

except errors.NoSuchId:

3565

# not in the tree

3566

pass

3567

g = graph.Graph(self.source.revisions)

3568

heads = g.heads(parent_keys)

3569

selected_keys = []

3570

for key in parent_keys:

3571

if key in heads and key not in selected_keys:

3572

selected_keys.append(key)

3573

return tuple([(root_id,)+ key for key in selected_keys])

3574

3575

def _new_root_data_stream(self, root_keys_to_create, parent_map):

3576

for root_key in root_keys_to_create:

3577

parent_keys = self._get_parent_keys(root_key, parent_map)

3578

yield versionedfile.FulltextContentFactory(root_key,

3579

parent_keys, None, '')

3580

3581

def _fetch_batch(self, revision_ids, basis_id, cache):

3837

3582

"""Fetch across a few revisions.

3838

3583

3839

3584

:param revision_ids: The revisions to copy

3840

3585

:param basis_id: The revision_id of a tree that must be in cache, used

3841

3586

as a basis for delta when no other base is available

3842

3587

:param cache: A cache of RevisionTrees that we can use.

3843

:param a_graph: A Graph object to determine the heads() of the

3844

rich-root data stream.

3845

3588

:return: The revision_id of the last converted tree. The RevisionTree

3846

3589

for it will be in cache

3847

3590

"""

3853

3596

pending_deltas = []

3854

3597

pending_revisions = []

3855

3598

parent_map = self.source.get_parent_map(revision_ids)

3856

self._fetch_parent_invs_for_stacking(parent_map, cache)

3857

self.source._safe_to_return_from_cache = True

3858

3599

for tree in self.source.revision_trees(revision_ids):

3859

# Find a inventory delta for this revision.

3860

# Find text entries that need to be copied, too.

3861

3600

current_revision_id = tree.get_revision_id()

3862

3601

parent_ids = parent_map.get(current_revision_id, ())

3863

parent_trees = self._get_trees(parent_ids, cache)

3864

possible_trees = list(parent_trees)

3865

if len(possible_trees) == 0:

3866

# There either aren't any parents, or the parents are ghosts,

3867

# so just use the last converted tree.

3868

possible_trees.append((basis_id, cache[basis_id]))

3869

3602

basis_id, delta = self._get_delta_for_revision(tree, parent_ids,

3870

possible_trees)

3871

revision = self.source.get_revision(current_revision_id)

3872

pending_deltas.append((basis_id, delta,

3873

current_revision_id, revision.parent_ids))

3603

basis_id, cache)

3874

3604

if self._converting_to_rich_root:

3875

3605

self._revision_id_to_root_id[current_revision_id] = \

3876

3606

tree.get_root_id()

3877

# Determine which texts are in present in this revision but not in

3878

# any of the available parents.

3879

texts_possibly_new_in_tree = set()

3607

# Find text entries that need to be copied

3880

3608

for old_path, new_path, file_id, entry in delta:

3881

if new_path is None:

3882

# This file_id isn't present in the new rev

3883

continue

3884

if not new_path:

3885

# This is the root

3886

if not self.target.supports_rich_root():

3887

# The target doesn't support rich root, so we don't

3888

# copy

3889

continue

3890

if self._converting_to_rich_root:

3891

# This can't be copied normally, we have to insert

3892

# it specially

3893

root_keys_to_create.add((file_id, entry.revision))

3894

continue

3895

kind = entry.kind

3896

texts_possibly_new_in_tree.add((file_id, entry.revision))

3897

for basis_id, basis_tree in possible_trees:

3898

basis_inv = basis_tree.inventory

3899

for file_key in list(texts_possibly_new_in_tree):

3900

file_id, file_revision = file_key

3901

try:

3902

entry = basis_inv[file_id]

3903

except errors.NoSuchId:

3904

continue

3905

if entry.revision == file_revision:

3906

texts_possibly_new_in_tree.remove(file_key)

3907

text_keys.update(texts_possibly_new_in_tree)

3609

if new_path is not None:

3610

if not new_path:

3611

# This is the root

3612

if not self.target.supports_rich_root():

3613

# The target doesn't support rich root, so we don't

3614

# copy

3615

continue

3616

if self._converting_to_rich_root:

3617

# This can't be copied normally, we have to insert

3618

# it specially

3619

root_keys_to_create.add((file_id, entry.revision))

3620

continue

3621

text_keys.add((file_id, entry.revision))

3622

revision = self.source.get_revision(current_revision_id)

3623

pending_deltas.append((basis_id, delta,

3624

current_revision_id, revision.parent_ids))

3908

3625

pending_revisions.append(revision)

3909

3626

cache[current_revision_id] = tree

3910

3627

basis_id = current_revision_id

3911

self.source._safe_to_return_from_cache = False

3912

3628

# Copy file texts

3913

3629

from_texts = self.source.texts

3914

3630

to_texts = self.target.texts

3915

3631

if root_keys_to_create:

3916

root_stream = _mod_fetch._new_root_data_stream(

3917

root_keys_to_create, self._revision_id_to_root_id, parent_map,

3918

self.source, graph=a_graph)

3632

root_stream = self._new_root_data_stream(root_keys_to_create,

3633

parent_map)

3919

3634

to_texts.insert_record_stream(root_stream)

3920

3635

to_texts.insert_record_stream(from_texts.get_record_stream(

3921

3636

text_keys, self.target._format._fetch_order,

3928

3643

# for the new revisions that we are about to insert. We do this

3929

3644

# before adding the revisions so that no revision is added until

3930

3645

# all the inventories it may depend on are added.

3931

# Note that this is overzealous, as we may have fetched these in an

3932

# earlier batch.

3933

3646

parent_ids = set()

3934

3647

revision_ids = set()

3935

3648

for revision in pending_revisions:

3938

3651

parent_ids.difference_update(revision_ids)

3939

3652

parent_ids.discard(_mod_revision.NULL_REVISION)

3940

3653

parent_map = self.source.get_parent_map(parent_ids)

3941

# we iterate over parent_map and not parent_ids because we don't

3942

# want to try copying any revision which is a ghost

3943

for parent_tree in self.source.revision_trees(parent_map):

3654

for parent_tree in self.source.revision_trees(parent_ids):

3655

basis_id, delta = self._get_delta_for_revision(tree, parent_ids, basis_id, cache)

3944

3656

current_revision_id = parent_tree.get_revision_id()

3945

3657

parents_parents = parent_map[current_revision_id]

3946

possible_trees = self._get_trees(parents_parents, cache)

3947

if len(possible_trees) == 0:

3948

# There either aren't any parents, or the parents are

3949

# ghosts, so just use the last converted tree.

3950

possible_trees.append((basis_id, cache[basis_id]))

3951

basis_id, delta = self._get_delta_for_revision(parent_tree,

3952

parents_parents, possible_trees)

3953

3658

self.target.add_inventory_by_delta(

3954

3659

basis_id, delta, current_revision_id, parents_parents)

3955

3660

# insert signatures and revisions

3969

3674

3970

3675

:param revision_ids: The list of revisions to fetch. Must be in

3971

3676

topological order.

3972

:param pb: A ProgressTask

3677

:param pb: A ProgressBar

3973

3678

:return: None

3974

3679

"""

3975

3680

basis_id, basis_tree = self._get_basis(revision_ids[0])

3978

3683

cache[basis_id] = basis_tree

3979

3684

del basis_tree # We don't want to hang on to it here

3980

3685

hints = []

3981

if self._converting_to_rich_root and len(revision_ids) > 100:

3982

a_graph = _mod_fetch._get_rich_root_heads_graph(self.source,

3983

revision_ids)

3984

else:

3985

a_graph = None

3986

3987

3686

for offset in range(0, len(revision_ids), batch_size):

3988

3687

self.target.start_write_group()

3989

3688

try:

3990

3689

pb.update('Transferring revisions', offset,

3991

3690

len(revision_ids))

3992

3691

batch = revision_ids[offset:offset+batch_size]

3993

basis_id = self._fetch_batch(batch, basis_id, cache,

3994

a_graph=a_graph)

3692

basis_id = self._fetch_batch(batch, basis_id, cache)

3995

3693

except:

3996

self.source._safe_to_return_from_cache = False

3997

3694

self.target.abort_write_group()

3998

3695

raise

3999

3696

else:

4011

3708

"""See InterRepository.fetch()."""

4012

3709

if fetch_spec is not None:

4013

3710

raise AssertionError("Not implemented yet...")

4014

ui.ui_factory.warn_experimental_format_fetch(self)

4015

3711

if (not self.source.supports_rich_root()

4016

3712

and self.target.supports_rich_root()):

4017

3713

self._converting_to_rich_root = True

4018

3714

self._revision_id_to_root_id = {}

4019

3715

else:

4020

3716

self._converting_to_rich_root = False

4021

# See <https://launchpad.net/bugs/456077> asking for a warning here

4022

if self.source._format.network_name() != self.target._format.network_name():

4023

ui.ui_factory.show_user_warning('cross_format_fetch',

4024

from_format=self.source._format,

4025

to_format=self.target._format)

4026

3717

revision_ids = self.target.search_missing_revision_ids(self.source,

4027

3718

revision_id, find_ghosts=find_ghosts).get_keys()

4028

3719

if not revision_ids:

4034

3725

# Walk though all revisions; get inventory deltas, copy referenced

4035

3726

# texts that delta references, insert the delta, revision and

4036

3727

# signature.

3728

first_rev = self.source.get_revision(revision_ids[0])

4037

3729

if pb is None:

4038

3730

my_pb = ui.ui_factory.nested_progress_bar()

4039

3731

pb = my_pb

4097

3789

:param to_convert: The disk object to convert.

4098

3790

:param pb: a progress bar to use for progress information.

4099

3791

"""

4100

pb = ui.ui_factory.nested_progress_bar()

3792

self.pb = pb

4101

3793

self.count = 0

4102

3794

self.total = 4

4103

3795

# this is only useful with metadir layouts - separated repo content.

4104

3796

# trigger an assertion if not such

4105

3797

repo._format.get_format_string()

4106

3798

self.repo_dir = repo.bzrdir

4107

pb.update('Moving repository to repository.backup')

3799

self.step('Moving repository to repository.backup')

4108

3800

self.repo_dir.transport.move('repository', 'repository.backup')

4109

3801

backup_transport = self.repo_dir.transport.clone('repository.backup')

4110

3802

repo._format.check_conversion_target(self.target_format)

4111

3803

self.source_repo = repo._format.open(self.repo_dir,

4112

3804

_found=True,

4113

3805

_override_transport=backup_transport)

4114

pb.update('Creating new repository')

3806

self.step('Creating new repository')

4115

3807

converted = self.target_format.initialize(self.repo_dir,

4116

3808

self.source_repo.is_shared())

4117

3809

converted.lock_write()

4118

3810

try:

4119

pb.update('Copying content')

3811

self.step('Copying content into repository.')

4120

3812

self.source_repo.copy_content_into(converted)

4121

3813

finally:

4122

3814

converted.unlock()

4123

pb.update('Deleting old repository content')

3815

self.step('Deleting old repository content.')

4124

3816

self.repo_dir.transport.delete_tree('repository.backup')

4125

ui.ui_factory.note('repository converted')

4126

pb.finished()

3817

self.pb.note('repository converted')

3818

3819

def step(self, message):

3820

"""Update the pb by a step."""

3821

self.count +=1

3822

self.pb.update(message, self.count, self.total)

4127

3823

4128

3824

4129

3825

_unescape_map = {

4158

3854

4159

3855

class _VersionedFileChecker(object):

4160

3856

4161

def __init__(self, repository, text_key_references=None, ancestors=None):

3857

def __init__(self, repository, text_key_references=None):

4162

3858

self.repository = repository

4163

3859

self.text_index = self.repository._generate_text_key_index(

4164

text_key_references=text_key_references, ancestors=ancestors)

3860

text_key_references=text_key_references)

4165

3861

4166

3862

def calculate_file_version_parents(self, text_key):

4167

3863

"""Calculate the correct parents for a file version according to

4185

3881

revision_id) tuples for versions that are present in this versioned

4186

3882

file, but not used by the corresponding inventory.

4187

3883

"""

4188

local_progress = None

4189

if progress_bar is None:

4190

local_progress = ui.ui_factory.nested_progress_bar()

4191

progress_bar = local_progress

4192

try:

4193

return self._check_file_version_parents(texts, progress_bar)

4194

finally:

4195

if local_progress:

4196

local_progress.finished()

4197

4198

def _check_file_version_parents(self, texts, progress_bar):

4199

"""See check_file_version_parents."""

4200

3884

wrong_parents = {}

4201

3885

self.file_ids = set([file_id for file_id, _ in

4202

3886

self.text_index.iterkeys()])

4203

3887

# text keys is now grouped by file_id

3888

n_weaves = len(self.file_ids)

3889

files_in_revisions = {}

3890

revisions_of_files = {}

4204

3891

n_versions = len(self.text_index)

4205

3892

progress_bar.update('loading text store', 0, n_versions)

4206

3893

parent_map = self.repository.texts.get_parent_map(self.text_index)

4208

3895

text_keys = self.repository.texts.keys()

4209

3896

unused_keys = frozenset(text_keys) - set(self.text_index)

4210

3897

for num, key in enumerate(self.text_index.iterkeys()):

4211

progress_bar.update('checking text graph', num, n_versions)

3898

if progress_bar is not None:

3899

progress_bar.update('checking text graph', num, n_versions)

4212

3900

correct_parents = self.calculate_file_version_parents(key)

4213

3901

try:

4214

3902

knit_parents = parent_map[key]

4299

3987

else:

4300

3988

new_pack.set_write_cache_size(1024*1024)

4301

3989

for substream_type, substream in stream:

4302

if 'stream' in debug.debug_flags:

4303

mutter('inserting substream: %s', substream_type)

4304

3990

if substream_type == 'texts':

4305

3991

self.target_repo.texts.insert_record_stream(substream)

4306

3992

elif substream_type == 'inventories':

4310

3996

else:

4311

3997

self._extract_and_insert_inventories(

4312

3998

substream, src_serializer)

4313

elif substream_type == 'inventory-deltas':

4314

self._extract_and_insert_inventory_deltas(

4315

substream, src_serializer)

4316

3999

elif substream_type == 'chk_bytes':

4317

4000

# XXX: This doesn't support conversions, as it assumes the

4318

4001

# conversion was done in the fetch code.

4349

4032

4350

4033

if versioned_file is None:

4351

4034

continue

4352

# TODO: key is often going to be a StaticTuple object

4353

# I don't believe we can define a method by which

4354

# (prefix,) + StaticTuple will work, though we could

4355

# define a StaticTuple.sq_concat that would allow you to

4356

# pass in either a tuple or a StaticTuple as the second

4357

# object, so instead we could have:

4358

# StaticTuple(prefix) + key here...

4359

4035

missing_keys.update((prefix,) + key for key in

4360

4036

versioned_file.get_missing_compression_parent_keys())

4361

4037

except NotImplementedError:

4376

4052

self.target_repo.pack(hint=hint)

4377

4053

return [], set()

4378

4054

4379

def _extract_and_insert_inventory_deltas(self, substream, serializer):

4380

target_rich_root = self.target_repo._format.rich_root_data

4381

target_tree_refs = self.target_repo._format.supports_tree_reference

4382

for record in substream:

4383

# Insert the delta directly

4384

inventory_delta_bytes = record.get_bytes_as('fulltext')

4385

deserialiser = inventory_delta.InventoryDeltaDeserializer()

4386

try:

4387

parse_result = deserialiser.parse_text_bytes(

4388

inventory_delta_bytes)

4389

except inventory_delta.IncompatibleInventoryDelta, err:

4390

trace.mutter("Incompatible delta: %s", err.msg)

4391

raise errors.IncompatibleRevision(self.target_repo._format)

4392

basis_id, new_id, rich_root, tree_refs, inv_delta = parse_result

4393

revision_id = new_id

4394

parents = [key[0] for key in record.parents]

4395

self.target_repo.add_inventory_by_delta(

4396

basis_id, inv_delta, revision_id, parents)

4397

4398

def _extract_and_insert_inventories(self, substream, serializer,

4399

parse_delta=None):

4055

def _extract_and_insert_inventories(self, substream, serializer):

4400

4056

"""Generate a new inventory versionedfile in target, converting data.

4401

4057

4402

4058

The inventory is retrieved from the source, (deserializing it), and

4403

4059

stored in the target (reserializing it in a different format).

4404

4060

"""

4405

target_rich_root = self.target_repo._format.rich_root_data

4406

target_tree_refs = self.target_repo._format.supports_tree_reference

4407

4061

for record in substream:

4408

# It's not a delta, so it must be a fulltext in the source

4409

# serializer's format.

4410

4062

bytes = record.get_bytes_as('fulltext')

4411

4063

revision_id = record.key[0]

4412

4064

inv = serializer.read_inventory_from_string(bytes, revision_id)

4413

4065

parents = [key[0] for key in record.parents]

4414

4066

self.target_repo.add_inventory(revision_id, inv, parents)

4415

# No need to keep holding this full inv in memory when the rest of

4416

# the substream is likely to be all deltas.

4417

del inv

4418

4067

4419

4068

def _extract_and_insert_revisions(self, substream, serializer):

4420

4069

for record in substream:

4469

4118

return [('signatures', signatures), ('revisions', revisions)]

4470

4119

4471

4120

def _generate_root_texts(self, revs):

4472

"""This will be called by get_stream between fetching weave texts and

4121

"""This will be called by __fetch between fetching weave texts and

4473

4122

fetching the inventory weave.

4123

4124

Subclasses should override this if they need to generate root texts

4125

after fetching weave texts.

4474

4126

"""

4475

4127

if self._rich_root_upgrade():

4476

return _mod_fetch.Inter1and2Helper(

4128

import bzrlib.fetch

4129

return bzrlib.fetch.Inter1and2Helper(

4477

4130

self.from_repository).generate_root_texts(revs)

4478

4131

else:

4479

4132

return []

4482

4135

phase = 'file'

4483

4136

revs = search.get_keys()

4484

4137

graph = self.from_repository.get_graph()

4485

revs = tsort.topo_sort(graph.get_parent_map(revs))

4138

revs = list(graph.iter_topo_order(revs))

4486

4139

data_to_fetch = self.from_repository.item_keys_introduced_by(revs)

4487

4140

text_keys = []

4488

4141

for knit_kind, file_id, revisions in data_to_fetch:

4507

4160

# will be valid.

4508

4161

for _ in self._generate_root_texts(revs):

4509

4162

yield _

4163

# NB: This currently reopens the inventory weave in source;

4164

# using a single stream interface instead would avoid this.

4165

from_weave = self.from_repository.inventories

4510

4166

# we fetch only the referenced inventories because we do not

4511

4167

# know for unselected inventories whether all their required

4512

4168

# texts are present in the other repository - it could be

4551

4207

if not keys:

4552

4208

# No need to stream something we don't have

4553

4209

continue

4554

if substream_kind == 'inventories':

4555

# Some missing keys are genuinely ghosts, filter those out.

4556

present = self.from_repository.inventories.get_parent_map(keys)

4557

revs = [key[0] for key in present]

4558

# Get the inventory stream more-or-less as we do for the

4559

# original stream; there's no reason to assume that records

4560

# direct from the source will be suitable for the sink. (Think

4561

# e.g. 2a -> 1.9-rich-root).

4562

for info in self._get_inventory_stream(revs, missing=True):

4563

yield info

4564

continue

4565

4566

4210

# Ask for full texts always so that we don't need more round trips

4567

4211

# after this stream.

4568

4212

# Some of the missing keys are genuinely ghosts, so filter absent

4583

4227

return (not self.from_repository._format.rich_root_data and

4584

4228

self.to_format.rich_root_data)

4585

4229

4586

def _get_inventory_stream(self, revision_ids, missing=False):

4230

def _get_inventory_stream(self, revision_ids):

4587

4231

from_format = self.from_repository._format

4588

if (from_format.supports_chks and self.to_format.supports_chks and

4589

from_format.network_name() == self.to_format.network_name()):

4590

raise AssertionError(

4591

"this case should be handled by GroupCHKStreamSource")

4592

elif 'forceinvdeltas' in debug.debug_flags:

4593

return self._get_convertable_inventory_stream(revision_ids,

4594

delta_versus_null=missing)

4595

elif from_format.network_name() == self.to_format.network_name():

4596

# Same format.

4597

return self._get_simple_inventory_stream(revision_ids,

4598

missing=missing)

4599

elif (not from_format.supports_chks and not self.to_format.supports_chks

4600

and from_format._serializer == self.to_format._serializer):

4601

# Essentially the same format.

4602

return self._get_simple_inventory_stream(revision_ids,

4603

missing=missing)

4232

if (from_format.supports_chks and self.to_format.supports_chks

4233

and (from_format._serializer == self.to_format._serializer)):

4234

# Both sides support chks, and they use the same serializer, so it

4235

# is safe to transmit the chk pages and inventory pages across

4236

# as-is.

4237

return self._get_chk_inventory_stream(revision_ids)

4238

elif (not from_format.supports_chks):

4239

# Source repository doesn't support chks. So we can transmit the

4240

# inventories 'as-is' and either they are just accepted on the

4241

# target, or the Sink will properly convert it.

4242

return self._get_simple_inventory_stream(revision_ids)

4604

4243

else:

4605

# Any time we switch serializations, we want to use an

4606

# inventory-delta based approach.

4607

return self._get_convertable_inventory_stream(revision_ids,

4608

delta_versus_null=missing)

4244

# XXX: Hack to make not-chk->chk fetch: copy the inventories as

4245

# inventories. Note that this should probably be done somehow

4246

# as part of bzrlib.repository.StreamSink. Except JAM couldn't

4247

# figure out how a non-chk repository could possibly handle

4248

# deserializing an inventory stream from a chk repo, as it

4249

# doesn't have a way to understand individual pages.

4250

return self._get_convertable_inventory_stream(revision_ids)

4609

4251

4610

def _get_simple_inventory_stream(self, revision_ids, missing=False):

4611

# NB: This currently reopens the inventory weave in source;

4612

# using a single stream interface instead would avoid this.

4252

def _get_simple_inventory_stream(self, revision_ids):

4613

4253

from_weave = self.from_repository.inventories

4614

if missing:

4615

delta_closure = True

4616

else:

4617

delta_closure = not self.delta_on_metadata()

4618

4254

yield ('inventories', from_weave.get_record_stream(

4619

4255

[(rev_id,) for rev_id in revision_ids],

4620

self.inventory_fetch_order(), delta_closure))

4621

4622

def _get_convertable_inventory_stream(self, revision_ids,

4623

delta_versus_null=False):

4624

# The two formats are sufficiently different that there is no fast

4625

# path, so we need to send just inventorydeltas, which any

4626

# sufficiently modern client can insert into any repository.

4627

# The StreamSink code expects to be able to

4628

# convert on the target, so we need to put bytes-on-the-wire that can

4629

# be converted. That means inventory deltas (if the remote is <1.19,

4630

# RemoteStreamSink will fall back to VFS to insert the deltas).

4631

yield ('inventory-deltas',

4632

self._stream_invs_as_deltas(revision_ids,

4633

delta_versus_null=delta_versus_null))

4634

4635

def _stream_invs_as_deltas(self, revision_ids, delta_versus_null=False):

4636

"""Return a stream of inventory-deltas for the given rev ids.

4637

4638

:param revision_ids: The list of inventories to transmit

4639

:param delta_versus_null: Don't try to find a minimal delta for this

4640

entry, instead compute the delta versus the NULL_REVISION. This

4641

effectively streams a complete inventory. Used for stuff like

4642

filling in missing parents, etc.

4643

"""

4256

self.inventory_fetch_order(),

4257

not self.delta_on_metadata()))

4258

4259

def _get_chk_inventory_stream(self, revision_ids):

4260

"""Fetch the inventory texts, along with the associated chk maps."""

4261

# We want an inventory outside of the search set, so that we can filter

4262

# out uninteresting chk pages. For now we use

4263

# _find_revision_outside_set, but if we had a Search with cut_revs, we

4264

# could use that instead.

4265

start_rev_id = self.from_repository._find_revision_outside_set(

4266

revision_ids)

4267

start_rev_key = (start_rev_id,)

4268

inv_keys_to_fetch = [(rev_id,) for rev_id in revision_ids]

4269

if start_rev_id != _mod_revision.NULL_REVISION:

4270

inv_keys_to_fetch.append((start_rev_id,))

4271

# Any repo that supports chk_bytes must also support out-of-order

4272

# insertion. At least, that is how we expect it to work

4273

# We use get_record_stream instead of iter_inventories because we want

4274

# to be able to insert the stream as well. We could instead fetch

4275

# allowing deltas, and then iter_inventories, but we don't know whether

4276

# source or target is more 'local' anyway.

4277

inv_stream = self.from_repository.inventories.get_record_stream(

4278

inv_keys_to_fetch, 'unordered',

4279

True) # We need them as full-texts so we can find their references

4280

uninteresting_chk_roots = set()

4281

interesting_chk_roots = set()

4282

def filter_inv_stream(inv_stream):

4283

for idx, record in enumerate(inv_stream):

4284

### child_pb.update('fetch inv', idx, len(inv_keys_to_fetch))

4285

bytes = record.get_bytes_as('fulltext')

4286

chk_inv = inventory.CHKInventory.deserialise(

4287

self.from_repository.chk_bytes, bytes, record.key)

4288

if record.key == start_rev_key:

4289

uninteresting_chk_roots.add(chk_inv.id_to_entry.key())

4290

p_id_map = chk_inv.parent_id_basename_to_file_id

4291

if p_id_map is not None:

4292

uninteresting_chk_roots.add(p_id_map.key())

4293

else:

4294

yield record

4295

interesting_chk_roots.add(chk_inv.id_to_entry.key())

4296

p_id_map = chk_inv.parent_id_basename_to_file_id

4297

if p_id_map is not None:

4298

interesting_chk_roots.add(p_id_map.key())

4299

### pb.update('fetch inventory', 0, 2)

4300

yield ('inventories', filter_inv_stream(inv_stream))

4301

# Now that we have worked out all of the interesting root nodes, grab

4302

# all of the interesting pages and insert them

4303

### pb.update('fetch inventory', 1, 2)

4304

interesting = chk_map.iter_interesting_nodes(

4305

self.from_repository.chk_bytes, interesting_chk_roots,

4306

uninteresting_chk_roots)

4307

def to_stream_adapter():

4308

"""Adapt the iter_interesting_nodes result to a single stream.

4309

4310

iter_interesting_nodes returns records as it processes them, along

4311

with keys. However, we only want to return the records themselves.

4312

"""

4313

for record, items in interesting:

4314

if record is not None:

4315

yield record

4316

# XXX: We could instead call get_record_stream(records.keys())

4317

# ATM, this will always insert the records as fulltexts, and

4318

# requires that you can hang on to records once you have gone

4319

# on to the next one. Further, it causes the target to

4320

# recompress the data. Testing shows it to be faster than

4321

# requesting the records again, though.

4322

yield ('chk_bytes', to_stream_adapter())

4323

### pb.update('fetch inventory', 2, 2)

4324

4325

def _get_convertable_inventory_stream(self, revision_ids):

4326

# XXX: One of source or target is using chks, and they don't have

4327

# compatible serializations. The StreamSink code expects to be

4328

# able to convert on the target, so we need to put

4329

# bytes-on-the-wire that can be converted

4330

yield ('inventories', self._stream_invs_as_fulltexts(revision_ids))

4331

4332

def _stream_invs_as_fulltexts(self, revision_ids):

4644

4333

from_repo = self.from_repository

4334

from_serializer = from_repo._format._serializer

4645

4335

revision_keys = [(rev_id,) for rev_id in revision_ids]

4646

4336

parent_map = from_repo.inventories.get_parent_map(revision_keys)

4647

# XXX: possibly repos could implement a more efficient iter_inv_deltas

4648

# method...

4649

inventories = self.from_repository.iter_inventories(

4650

revision_ids, 'topological')

4651

format = from_repo._format

4652

invs_sent_so_far = set([_mod_revision.NULL_REVISION])

4653

inventory_cache = lru_cache.LRUCache(50)

4654

null_inventory = from_repo.revision_tree(

4655

_mod_revision.NULL_REVISION).inventory

4656

# XXX: ideally the rich-root/tree-refs flags would be per-revision, not

4657

# per-repo (e.g. streaming a non-rich-root revision out of a rich-root

4658

# repo back into a non-rich-root repo ought to be allowed)

4659

serializer = inventory_delta.InventoryDeltaSerializer(

4660

versioned_root=format.rich_root_data,

4661

tree_references=format.supports_tree_reference)

4662

for inv in inventories:

4337

for inv in self.from_repository.iter_inventories(revision_ids):

4338

# XXX: This is a bit hackish, but it works. Basically,

4339

# CHKSerializer 'accidentally' supports

4340

# read/write_inventory_to_string, even though that is never

4341

# the format that is stored on disk. It *does* give us a

4342

# single string representation for an inventory, so live with

4343

# it for now.

4344

# This would be far better if we had a 'serialized inventory

4345

# delta' form. Then we could use 'inventory._make_delta', and

4346

# transmit that. This would both be faster to generate, and

4347

# result in fewer bytes-on-the-wire.

4348

as_bytes = from_serializer.write_inventory_to_string(inv)

4663

4349

key = (inv.revision_id,)

4664

4350

parent_keys = parent_map.get(key, ())

4665

delta = None

4666

if not delta_versus_null and parent_keys:

4667

# The caller did not ask for complete inventories and we have

4668

# some parents that we can delta against. Make a delta against

4669

# each parent so that we can find the smallest.

4670

parent_ids = [parent_key[0] for parent_key in parent_keys]

4671

for parent_id in parent_ids:

4672

if parent_id not in invs_sent_so_far:

4673

# We don't know that the remote side has this basis, so

4674

# we can't use it.

4675

continue

4676

if parent_id == _mod_revision.NULL_REVISION:

4677

parent_inv = null_inventory

4678

else:

4679

parent_inv = inventory_cache.get(parent_id, None)

4680

if parent_inv is None:

4681

parent_inv = from_repo.get_inventory(parent_id)

4682

candidate_delta = inv._make_delta(parent_inv)

4683

if (delta is None or

4684

len(delta) > len(candidate_delta)):

4685

delta = candidate_delta

4686

basis_id = parent_id

4687

if delta is None:

4688

# Either none of the parents ended up being suitable, or we

4689

# were asked to delta against NULL

4690

basis_id = _mod_revision.NULL_REVISION

4691

delta = inv._make_delta(null_inventory)

4692

invs_sent_so_far.add(inv.revision_id)

4693

inventory_cache[inv.revision_id] = inv

4694

delta_serialized = ''.join(

4695

serializer.delta_to_lines(basis_id, key[-1], delta))

4696

4351

yield versionedfile.FulltextContentFactory(

4697

key, parent_keys, None, delta_serialized)

4352

key, parent_keys, None, as_bytes)

4698

4353

4699

4354

4700

4355

def _iter_for_revno(repo, partial_history_cache, stop_index=None,

Older »