@@ -23 +23 @@
 except ImportError:
+from bzrlib.lazy_import import lazy_import
+lazy_import(globals(), """
 from bzrlib import (
     graph as _mod_graph,
+from bzrlib.repofmt import pack_repo
 from bzrlib.btree_index import BTreeBuilder
 from bzrlib.lru_cache import LRUSizeCache
-from bzrlib.tsort import topo_sort
 from bzrlib.versionedfile import (
     AbsentContentFactory,
     ChunkedContentFactory,
     FulltextContentFactory,
+    VersionedFilesWithFallbacks,
 # Minimum number of uncompressed bytes to try fetch at once when retrieving
@@ -135 +142 @@
             self._content = ''.join(self._content_chunks)
             self._content_chunks = None
         if self._content is None:
-            if self._z_content is None:
+            # We join self._z_content_chunks here, because if we are
+            # decompressing, then it is *very* likely that we have a single
+            # chunk
+            if self._z_content_chunks is None:
                 raise AssertionError('No content to decompress')
-            if self._z_content == '':
+            z_content = ''.join(self._z_content_chunks)
+            if z_content == '':
                 self._content = ''
             elif self._compressor_name == 'lzma':
                 # We don't do partial lzma decomp yet
-                self._content = pylzma.decompress(self._z_content)
+                self._content = pylzma.decompress(z_content)
             elif self._compressor_name == 'zlib':
                 # Start a zlib decompressor
                 if num_bytes * 4 > self._content_length * 3:
                     # If we are requesting more that 3/4ths of the content,
                     # just extract the whole thing in a single pass
                     num_bytes = self._content_length
-                    self._content = zlib.decompress(self._z_content)
+                    self._content = zlib.decompress(z_content)
                 else:
                     self._z_content_decompressor = zlib.decompressobj()
                     # Seed the decompressor with the uncompressed bytes, so
                     # that the rest of the code is simplified
                     self._content = self._z_content_decompressor.decompress(
-                        self._z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
+                        z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
                     if not self._z_content_decompressor.unconsumed_tail:
                         self._z_content_decompressor = None
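
For reference, the partial-decompression trick this hunk relies on can be exercised on its own. The following is a minimal, self-contained sketch (not bzrlib code; the helper name is invented): `zlib.decompressobj` is given the whole compressed string but a capped output size, and `unconsumed_tail` tells the caller whether compressed input is still pending.

    import zlib

    def partial_decompress(z_bytes, want_bytes, window=32768):
        # Decompress roughly the first want_bytes of a zlib stream.  The
        # max_length argument caps the returned plaintext; whatever compressed
        # input was not consumed stays in decomp.unconsumed_tail.
        decomp = zlib.decompressobj()
        out = decomp.decompress(z_bytes, want_bytes + window)
        done = not decomp.unconsumed_tail
        return out, decomp, done

    z = zlib.compress('x' * 1000000)
    prefix, decomp, done = partial_decompress(z, 4096)
    # 'done' is False here; feeding decomp.unconsumed_tail back into
    # decomp.decompress() would yield the rest of the text.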
@@ -207 +218 @@
             # XXX: Define some GCCorrupt error ?
             raise AssertionError('Invalid bytes: (%d) != %d + %d' %
                                  (len(bytes), pos, self._z_content_length))
-        self._z_content = bytes[pos:]
+        self._z_content_chunks = (bytes[pos:],)
+
+    @property
+    def _z_content(self):
+        """Return z_content_chunks as a simple string.
+
+        Meant only to be used by the test suite.
+        """
+        if self._z_content_chunks is not None:
+            return ''.join(self._z_content_chunks)
+        return None
 
     def from_bytes(cls, bytes):
@@ -269 +290 @@
         self._content_length = length
         self._content_chunks = content_chunks
         self._content = None
-        self._z_content = None
+        self._z_content_chunks = None
 
     def set_content(self, content):
         """Set the content of this block."""
         self._content_length = len(content)
         self._content = content
-        self._z_content = None
+        self._z_content_chunks = None
 
     def _create_z_content_using_lzma(self):
         if self._content_chunks is not None:
             self._content = ''.join(self._content_chunks)
             self._content_chunks = None
         if self._content is None:
             raise AssertionError('Nothing to compress')
-        self._z_content = pylzma.compress(self._content)
-        self._z_content_length = len(self._z_content)
+        z_content = pylzma.compress(self._content)
+        self._z_content_chunks = (z_content,)
+        self._z_content_length = len(z_content)
 
-    def _create_z_content_from_chunks(self):
+    def _create_z_content_from_chunks(self, chunks):
         compressor = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)
-        compressed_chunks = map(compressor.compress, self._content_chunks)
+        # Peak in this point is 1 fulltext, 1 compressed text, + zlib overhead
+        # (measured peak is maybe 30MB over the above...)
+        compressed_chunks = map(compressor.compress, chunks)
         compressed_chunks.append(compressor.flush())
-        self._z_content = ''.join(compressed_chunks)
-        self._z_content_length = len(self._z_content)
+        # Ignore empty chunks
+        self._z_content_chunks = [c for c in compressed_chunks if c]
+        self._z_content_length = sum(map(len, self._z_content_chunks))
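
As an aside, the chunk-at-a-time compression pattern used by the new `_create_z_content_from_chunks` can be sketched standalone (the helper name is made up): one `compressobj` is shared across all chunks, empty outputs are dropped, and the total compressed length is a `sum()` rather than the length of a joined string.

    import zlib

    def compress_chunks(chunks):
        # One zlib stream across many input chunks; the concatenation of the
        # returned pieces is a valid zlib stream.
        compressor = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)
        out = [compressor.compress(chunk) for chunk in chunks]
        out.append(compressor.flush())
        out = [c for c in out if c]   # zlib usually returns '' until flush
        return out, sum(map(len, out))

    z_chunks, z_len = compress_chunks(['hello world\n'] * 1000)
    assert zlib.decompress(''.join(z_chunks)) == 'hello world\n' * 1000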
@@ -296 +321 @@
     def _create_z_content(self):
-        if self._z_content is not None:
+        if self._z_content_chunks is not None:
             return
         if _USE_LZMA:
             self._create_z_content_using_lzma()
             return
         if self._content_chunks is not None:
-            self._create_z_content_from_chunks()
+            chunks = self._content_chunks
         else:
-            self._z_content = zlib.compress(self._content)
-            self._z_content_length = len(self._z_content)
+            chunks = (self._content,)
+        self._create_z_content_from_chunks(chunks)
 
-    def to_bytes(self):
-        """Encode the information into a byte stream."""
+    def to_chunks(self):
+        """Create the byte stream as a series of 'chunks'"""
         self._create_z_content()
         if _USE_LZMA:
             header = self.GCB_LZ_HEADER
         else:
             header = self.GCB_HEADER
-                  '%d\n%d\n' % (self._z_content_length, self._content_length),
+        chunks = ['%s%d\n%d\n'
+                  % (header, self._z_content_length, self._content_length),
+                  ]
+        chunks.extend(self._z_content_chunks)
+        total_len = sum(map(len, chunks))
+        return total_len, chunks
+
+    def to_bytes(self):
+        """Encode the information into a byte stream."""
+        total_len, chunks = self.to_chunks()
         return ''.join(chunks)
 
     def _dump(self, include_text=False):
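
The net effect of the hunk above is that `to_bytes()` is now a thin wrapper over `to_chunks()`, so callers that can handle a list of strings avoid one large join. A hedged consumer sketch (the `write_block` helper and the file object are illustrative, not bzrlib API):

    def write_block(block, out_file):
        # 'block' is assumed to be a GroupCompressBlock as patched above.
        total_len, chunks = block.to_chunks()
        for chunk in chunks:
            out_file.write(chunk)
        return total_len   # equals len(block.to_bytes()), without the join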
@@ -460 +491 @@
     _full_enough_block_size = 3*1024*1024 # size at which we won't repack
     _full_enough_mixed_block_size = 2*768*1024 # 1.5MB
 
-    def __init__(self, block):
+    def __init__(self, block, get_compressor_settings=None):
         self._block = block
         # We need to preserve the ordering
         self._factories = []
         self._last_byte = 0
+        self._get_settings = get_compressor_settings
+        self._compressor_settings = None
+
+    def _get_compressor_settings(self):
+        if self._compressor_settings is not None:
+            return self._compressor_settings
+        settings = None
+        if self._get_settings is not None:
+            settings = self._get_settings()
+        if settings is None:
+            vf = GroupCompressVersionedFiles
+            settings = vf._DEFAULT_COMPRESSOR_SETTINGS
+        self._compressor_settings = settings
+        return self._compressor_settings
 
     def add_factory(self, key, parents, start, end):
         if not self._factories:
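
The settings callback added to `_LazyGroupContentManager.__init__` is evaluated lazily and at most once; until a block actually needs repacking, no settings lookup happens. A standalone sketch of that caching pattern (class and function names here are invented for illustration):

    class _LazySettings(object):

        _DEFAULT = {'max_bytes_to_index': 1024 * 1024}

        def __init__(self, get_settings=None):
            self._get_settings = get_settings
            self._cached = None

        def settings(self):
            if self._cached is not None:
                return self._cached
            settings = None
            if self._get_settings is not None:
                settings = self._get_settings()
            if settings is None:
                settings = self._DEFAULT
            self._cached = settings
            return settings

    calls = []
    def expensive_lookup():
        calls.append(1)
        return {'max_bytes_to_index': 256 * 1024}

    lazy = _LazySettings(expensive_lookup)
    lazy.settings(); lazy.settings()
    assert len(calls) == 1   # the callback ran only once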
@@ -503 +548 @@
             new_block.set_content(self._block._content[:last_byte])
         self._block = new_block
 
+    def _make_group_compressor(self):
+        return GroupCompressor(self._get_compressor_settings())
+
     def _rebuild_block(self):
         """Create a new GroupCompressBlock with only the referenced texts."""
-        compressor = GroupCompressor()
+        compressor = self._make_group_compressor()
         tstart = time.time()
         old_length = self._block._content_length
@@ -523 +571 @@
         # block? It seems hard to come up with a method that it would
         # expand, since we do full compression again. Perhaps based on a
         # request that ends up poorly ordered?
+        # TODO: If the content would have expanded, then we would want to
+        #       handle a case where we need to split the block.
+        #       Now that we have a user-tweakable option
+        #       (max_bytes_to_index), it is possible that one person set it
+        #       to a very low value, causing poor compression.
         delta = time.time() - tstart
         self._block = new_block
         trace.mutter('creating new compressed block on-the-fly in %.3fs'
@@ -679 +732 @@
         z_header_bytes = zlib.compress(header_bytes)
         z_header_bytes_len = len(z_header_bytes)
-        block_bytes = self._block.to_bytes()
+        block_bytes_len, block_chunks = self._block.to_chunks()
         lines.append('%d\n%d\n%d\n' % (z_header_bytes_len, header_bytes_len,
-                                       len(block_bytes)))
+                                       block_bytes_len))
         lines.append(z_header_bytes)
-        lines.append(block_bytes)
-        del z_header_bytes, block_bytes
+        lines.extend(block_chunks)
+        del z_header_bytes, block_chunks
+        # TODO: This is a point where we will double the memory consumption. To
+        #       avoid this, we probably have to switch to a 'chunked' api
         return ''.join(lines)
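
For orientation, the wire layout that `_wire_bytes` produces and `from_bytes` (next hunk) parses is a storage-kind line, three length lines, the zlib-compressed header, then the block. A minimal round-trip sketch under that assumption (dummy payloads and invented helper names; the real header and block contents are bzr-specific):

    import zlib

    def frame(storage_kind, header_bytes, block_chunks):
        z_header = zlib.compress(header_bytes)
        lines = ['%s\n%d\n%d\n%d\n' % (storage_kind, len(z_header),
                                       len(header_bytes),
                                       sum(map(len, block_chunks)))]
        lines.append(z_header)
        lines.extend(block_chunks)
        return ''.join(lines)

    def unframe(data):
        (storage_kind, z_header_len, header_len,
         block_len, rest) = data.split('\n', 4)
        z_header_len = int(z_header_len)
        header = zlib.decompress(rest[:z_header_len])
        assert len(header) == int(header_len)
        block = rest[z_header_len:]
        assert len(block) == int(block_len)
        return storage_kind, header, block

    wire = frame('groupcompress-block', 'key1\x00rev-1\n', ['z' * 10, 'q' * 5])
    assert unframe(wire)[1] == 'key1\x00rev-1\n'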
@@ -691 +746 @@
     def from_bytes(cls, bytes):
         # TODO: This does extra string copying, probably better to do it a
         #       different way. At a minimum this creates 2 copies of the
         (storage_kind, z_header_len, header_len,
          block_len, rest) = bytes.split('\n', 4)
@@ -757 +813 @@
         self.labels_deltas = {}
         self._delta_index = None # Set by the children
         self._block = GroupCompressBlock()
+        if settings is None:
+            self._settings = {}
+        else:
+            self._settings = settings
 
     def compress(self, key, bytes, expected_sha, nostore_sha=None, soft=False):
         """Compress lines with label key.
@@ -855 +915 @@
         After calling this, the compressor should no longer be used
         """
-        # TODO: this causes us to 'bloat' to 2x the size of content in the
-        #       group. This has an impact for 'commit' of large objects.
-        #       One possibility is to use self._content_chunks, and be lazy and
-        #       only fill out self._content as a full string when we actually
-        #       need it. That would at least drop the peak memory consumption
-        #       for 'commit' down to ~1x the size of the largest file, at a
-        #       cost of increased complexity within this code. 2x is still <<
-        #       3x the size of the largest file, so we are doing ok.
         self._block.set_chunked_content(self.chunks, self.endpoint)
         self.chunks = None
         self._delta_index = None
@@ -886 +938 @@
 class PythonGroupCompressor(_CommonGroupCompressor):
 
-    def __init__(self):
+    def __init__(self, settings=None):
         """Create a GroupCompressor.
 
         Used only if the pyrex version is not available.
         """
-        super(PythonGroupCompressor, self).__init__()
+        super(PythonGroupCompressor, self).__init__(settings)
         self._delta_index = LinesDeltaIndex([])
         # The actual content is managed by LinesDeltaIndex
         self.chunks = self._delta_index.lines
@@ -947 +998 @@
-    def __init__(self):
-        super(PyrexGroupCompressor, self).__init__()
-        self._delta_index = DeltaIndex()
+    def __init__(self, settings=None):
+        super(PyrexGroupCompressor, self).__init__(settings)
+        max_bytes_to_index = self._settings.get('max_bytes_to_index', 0)
+        self._delta_index = DeltaIndex(max_bytes_to_index=max_bytes_to_index)
 
     def _compress(self, key, bytes, max_delta_size, soft=False):
         """see _CommonGroupCompressor._compress"""
@@ -1027 +1080 @@
         index = _GCGraphIndex(graph_index, lambda:True, parents=parents,
             add_callback=graph_index.add_nodes,
             inconsistency_fatal=inconsistency_fatal)
-        access = knit._DirectPackAccess({})
+        access = pack_repo._DirectPackAccess({})
         access.set_writer(writer, graph_index, (transport, 'newpack'))
         result = GroupCompressVersionedFiles(index, access, delta)
         result.stream = stream
@@ -1044 +1097 @@
 class _BatchingBlockFetcher(object):
     """Fetch group compress blocks in batches.
 
     :ivar total_bytes: int of expected number of bytes needed to fetch the
         currently pending batch.
     """
 
-    def __init__(self, gcvf, locations):
+    def __init__(self, gcvf, locations, get_compressor_settings=None):
         self.gcvf = gcvf
         self.locations = locations
@@ -1102 +1156 @@
     def yield_factories(self, full_flush=False):
         """Yield factories for keys added since the last yield. They will be
         returned in the order they were added via add_key.
 
         :param full_flush: by default, some results may not be returned in case
             they can be part of the next batch. If full_flush is True, then
             all results are returned.
@@ -1136 +1190 @@
                     memos_to_get_stack.pop()
                     block = self.batch_memos[read_memo]
-                    self.manager = _LazyGroupContentManager(block)
+                    self.manager = _LazyGroupContentManager(block,
+                        get_compressor_settings=self._get_compressor_settings)
                     self.last_read_memo = read_memo
                 start, end = index_memo[3:5]
                 self.manager.add_factory(key, parents, start, end)
@@ -1149 +1204 @@
         self.total_bytes = 0
@@ -1152 +1207 @@
-class GroupCompressVersionedFiles(VersionedFiles):
+class GroupCompressVersionedFiles(VersionedFilesWithFallbacks):
     """A group-compress based VersionedFiles implementation."""
 
+    # This controls how the GroupCompress DeltaIndex works. Basically, we
+    # compute hash pointers into the source blocks (so hash(text) => text).
+    # However each of these references costs some memory in trade against a
+    # more accurate match result. For very large files, they either are
+    # pre-compressed and change in bulk whenever they change, or change in just
+    # local blocks. Either way, 'improved resolution' is not very helpful,
+    # versus running out of memory trying to track everything. The default max
+    # gives 100% sampling of a 1MB file.
+    _DEFAULT_MAX_BYTES_TO_INDEX = 1024 * 1024
+    _DEFAULT_COMPRESSOR_SETTINGS = {'max_bytes_to_index':
+                                    _DEFAULT_MAX_BYTES_TO_INDEX}
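
For scale, the default above yields the settings dict `{'max_bytes_to_index': 1048576}`; a caller could hand the compressor a smaller budget. A hedged usage sketch (the 256kB figure is an arbitrary example; `GroupCompressor` is whichever of the two compressor classes the module selected at import time):

    small = {'max_bytes_to_index': 256 * 1024}   # example value only
    compressor = GroupCompressor(small)
    # With the C extension this reaches DeltaIndex(max_bytes_to_index=262144);
    # with no settings the compressor falls back to an empty dict, so
    # max_bytes_to_index resolves to 0 per the PyrexGroupCompressor hunk above.
    default_compressor = GroupCompressor()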
@@ -1155 +1222 @@
-    def __init__(self, index, access, delta=True, _unadded_refs=None):
+    def __init__(self, index, access, delta=True, _unadded_refs=None,
+                 _group_cache=None):
         """Create a GroupCompressVersionedFiles object.
 
         :param index: The index object storing access and graph data.
         :param access: The access object storing raw data.
         :param delta: Whether to delta compress or just entropy compress.
         :param _unadded_refs: private parameter, don't use.
+        :param _group_cache: private parameter, don't use.
         """
         self._index = index
         self._access = access
         self._delta = delta
         if _unadded_refs is None:
             _unadded_refs = {}
         self._unadded_refs = _unadded_refs
-        self._group_cache = LRUSizeCache(max_size=50*1024*1024)
-        self._fallback_vfs = []
+        if _group_cache is None:
+            _group_cache = LRUSizeCache(max_size=50*1024*1024)
+        self._group_cache = _group_cache
+        self._immediate_fallback_vfs = []
+        self._max_bytes_to_index = None
 
     def without_fallbacks(self):
         """Return a clone of this object without any fallbacks configured."""
         return GroupCompressVersionedFiles(self._index, self._access,
-            self._delta, _unadded_refs=dict(self._unadded_refs))
+            self._delta, _unadded_refs=dict(self._unadded_refs),
+            _group_cache=self._group_cache)
 
     def add_lines(self, key, parents, lines, parent_texts=None,
         left_matching_blocks=None, nostore_sha=None, random_id=False,
@@ -1287 +1360 @@
         self._check_lines_not_unicode(lines)
         self._check_lines_are_lines(lines)
 
-    def get_known_graph_ancestry(self, keys):
-        """Get a KnownGraph instance with the ancestry of keys."""
-        # Note that this is identical to
-        # KnitVersionedFiles.get_known_graph_ancestry, but they don't share
-        parent_map, missing_keys = self._index.find_ancestry(keys)
-        for fallback in self._fallback_vfs:
-            if not missing_keys:
-                break
-            (f_parent_map, f_missing_keys) = fallback._index.find_ancestry(
-                missing_keys)
-            parent_map.update(f_parent_map)
-            missing_keys = f_missing_keys
-        kg = _mod_graph.KnownGraph(parent_map)
-        return kg
 
     def get_parent_map(self, keys):
         """Get a map of the graph parents of keys.
@@ -1451 +1508 @@
             the defined order, regardless of source.
         """
         if ordering == 'topological':
-            present_keys = topo_sort(parent_map)
+            present_keys = tsort.topo_sort(parent_map)
         else:
             # ordering == 'groupcompress'
             # XXX: This only optimizes for the target ordering. We may need
@@ -1546 +1603 @@
         #  - we encounter an unadded ref, or
         #  - we run out of keys, or
         #  - the total bytes to retrieve for this batch > BATCH_SIZE
-        batcher = _BatchingBlockFetcher(self, locations)
+        batcher = _BatchingBlockFetcher(self, locations,
+            get_compressor_settings=self._get_compressor_settings)
         for source, keys in source_keys:
             if source is self:
                 for key in keys:
@@ -1598 +1656 @@
         for _ in self._insert_record_stream(stream, random_id=False):
             pass
 
+    def _get_compressor_settings(self):
+        if self._max_bytes_to_index is None:
+            # TODO: VersionedFiles don't know about their containing
+            #       repository, so they don't have much of an idea about their
+            #       location. So for now, this is only a global option.
+            c = config.GlobalConfig()
+            val = c.get_user_option('bzr.groupcompress.max_bytes_to_index')
+            if val is not None:
+                try:
+                    val = int(val)
+                except ValueError, e:
+                    trace.warning('Value for '
+                                  '"bzr.groupcompress.max_bytes_to_index"'
+                                  ' %r is not an integer'
+                                  % (val,))
+                    val = None
+            if val is None:
+                val = self._DEFAULT_MAX_BYTES_TO_INDEX
+            self._max_bytes_to_index = val
+        return {'max_bytes_to_index': self._max_bytes_to_index}
+
+    def _make_group_compressor(self):
+        return GroupCompressor(self._get_compressor_settings())
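
The option is read from the user's global configuration via `config.GlobalConfig().get_user_option('bzr.groupcompress.max_bytes_to_index')`; anything that does not parse as an integer is warned about and ignored. A standalone sketch of that parse-with-fallback behaviour (the helper name is invented):

    def parse_max_bytes_to_index(raw, default=1024 * 1024):
        # Mirrors the handling above: unset or malformed values fall back to
        # the 1MB default instead of raising.
        val = raw
        if val is not None:
            try:
                val = int(val)
            except ValueError:
                val = None
        if val is None:
            val = default
        return val

    assert parse_max_bytes_to_index(None) == 1024 * 1024
    assert parse_max_bytes_to_index('262144') == 262144
    assert parse_max_bytes_to_index('not-a-number') == 1024 * 1024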
@@ -1601 +1683 @@
     def _insert_record_stream(self, stream, random_id=False, nostore_sha=None,
                               reuse_blocks=True):
         """Internal core to insert a record stream into this container.
@@ -1627 +1709 @@
         # This will go up to fulltexts for gc to gc fetching, which isn't
-        self._compressor = GroupCompressor()
+        self._compressor = self._make_group_compressor()
         self._unadded_refs = {}
         keys_to_add = []
         def flush():
-            bytes = self._compressor.flush().to_bytes()
-            self._compressor = GroupCompressor()
+            bytes_len, chunks = self._compressor.flush().to_chunks()
+            self._compressor = self._make_group_compressor()
+            # Note: At this point we still have 1 copy of the fulltext (in
+            #       record and the var 'bytes'), and this generates 2 copies of
+            #       the compressed text (one for bytes, one in chunks)
+            # TODO: Push 'chunks' down into the _access api, so that we don't
+            #       have to double compressed memory here
+            # TODO: Figure out how to indicate that we would be happy to free
+            #       the fulltext content at this point. Note that sometimes we
+            #       will want it later (streaming CHK pages), but most of the
+            #       time we won't (everything else)
+            bytes = ''.join(chunks)
             index, start, length = self._access.add_raw_records(
                 [(None, len(bytes))], bytes)[0]
@@ -1802 +1895 @@
         """See VersionedFiles.keys."""
         if 'evil' in debug.debug_flags:
             trace.mutter_callsite(2, "keys scales with size of history")
-        sources = [self._index] + self._fallback_vfs
+        sources = [self._index] + self._immediate_fallback_vfs
         result = set()
         for source in sources:
             result.update(source.keys())
@@ -1811 +1905 @@
+class _GCBuildDetails(object):
+    """A blob of data about the build details.
+
+    This stores the minimal data, which then allows compatibility with the old
+    api, without taking as much memory.
+    """
+
+    __slots__ = ('_index', '_group_start', '_group_end', '_basis_end',
+                 '_delta_end', '_parents')
+
+    method = 'group'
+    compression_parent = None
+
+    def __init__(self, parents, position_info):
+        self._parents = parents
+        (self._index, self._group_start, self._group_end, self._basis_end,
+         self._delta_end) = position_info
+
+    def __repr__(self):
+        return '%s(%s, %s)' % (self.__class__.__name__,
+            self.index_memo, self._parents)
+
+    @property
+    def index_memo(self):
+        return (self._index, self._group_start, self._group_end,
+                self._basis_end, self._delta_end)
+
+    @property
+    def record_details(self):
+        return static_tuple.StaticTuple(self.method, None)
+
+    def __getitem__(self, offset):
+        """Compatibility thunk to act like a tuple."""
+        if offset == 0:
+            return self.index_memo
+        elif offset == 1:
+            return self.compression_parent # Always None
+        elif offset == 2:
+            return self._parents
+        elif offset == 3:
+            return self.record_details
+        else:
+            raise IndexError('offset out of range')
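
`_GCBuildDetails` stands in for the 4-tuple the old code stored per key, while `__slots__` keeps it small; indexing still behaves like the tuple did. A hedged illustration (the key and position values are made up):

    details = _GCBuildDetails(parents=(('file-id', 'rev-1'),),
                              position_info=('index', 0, 1024, 0, 512))
    assert details[0] == details.index_memo == ('index', 0, 1024, 0, 512)
    assert details[1] is None                     # compression_parent
    assert details[2] == (('file-id', 'rev-1'),)  # parents
    assert details[3] == details.record_details   # ('group', None)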
@@ -1812 +1953 @@
 class _GCGraphIndex(object):
     """Mapper from GroupCompressVersionedFiles needs into GraphIndex storage."""
@@ -1843 +1984 @@
         # repeated over and over, this creates a surplus of ints
         self._int_cache = {}
         if track_external_parent_refs:
-            self._key_dependencies = knit._KeyRefs(
+            self._key_dependencies = _KeyRefs(
                 track_new_keys=track_new_keys)
         else:
             self._key_dependencies = None
@@ -2033 +2173 @@
         # each, or about 7MB. Note that it might be even more when you consider
         # how PyInt is allocated in separate slabs. And you can't return a slab
         # to the OS if even 1 int on it is in use. Note though that Python uses
-        # a LIFO when re-using PyInt slots, which probably causes more
+        # a LIFO when re-using PyInt slots, which might cause more
         # fragmentation.
         start = int(bits[0])
         start = self._int_cache.setdefault(start, start)