=== modified file 'bzrlib/groupcompress.py'
@@ -23 +23 @@
 except ImportError:
+from bzrlib.lazy_import import lazy_import
+lazy_import(globals(), """
 from bzrlib import (
     graph as _mod_graph,
+from bzrlib.repofmt import pack_repo
 from bzrlib.btree_index import BTreeBuilder
 from bzrlib.lru_cache import LRUSizeCache
-from bzrlib.tsort import topo_sort
 from bzrlib.versionedfile import (
     AbsentContentFactory,
     ChunkedContentFactory,
     FulltextContentFactory,
+    VersionedFilesWithFallbacks,
 # Minimum number of uncompressed bytes to try fetch at once when retrieving
@@ -135 +142 @@
             self._content = ''.join(self._content_chunks)
             self._content_chunks = None
         if self._content is None:
-            if self._z_content is None:
+            # We join self._z_content_chunks here, because if we are
+            # decompressing, then it is *very* likely that we have a single
+            if self._z_content_chunks is None:
                 raise AssertionError('No content to decompress')
-            if self._z_content == '':
+            z_content = ''.join(self._z_content_chunks)
                 self._content = ''
             elif self._compressor_name == 'lzma':
                 # We don't do partial lzma decomp yet
-                self._content = pylzma.decompress(self._z_content)
+                self._content = pylzma.decompress(z_content)
             elif self._compressor_name == 'zlib':
                 # Start a zlib decompressor
                 if num_bytes * 4 > self._content_length * 3:
                     # If we are requesting more than 3/4ths of the content,
                     # just extract the whole thing in a single pass
                     num_bytes = self._content_length
-                    self._content = zlib.decompress(self._z_content)
+                    self._content = zlib.decompress(z_content)
                     self._z_content_decompressor = zlib.decompressobj()
                     # Seed the decompressor with the uncompressed bytes, so
                     # that the rest of the code is simplified
                     self._content = self._z_content_decompressor.decompress(
-                        self._z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
+                        z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
                     if not self._z_content_decompressor.unconsumed_tail:
                         self._z_content_decompressor = None
@@ -207 +218 @@
             # XXX: Define some GCCorrupt error ?
             raise AssertionError('Invalid bytes: (%d) != %d + %d' %
                 (len(bytes), pos, self._z_content_length))
-        self._z_content = bytes[pos:]
+        self._z_content_chunks = (bytes[pos:],)
+
+    def _z_content(self):
+        """Return z_content_chunks as a simple string.
+
+        Meant only to be used by the test suite.
+        """
+        if self._z_content_chunks is not None:
+            return ''.join(self._z_content_chunks)
 
     def from_bytes(cls, bytes):
@@ -269 +290 @@
         self._content_length = length
         self._content_chunks = content_chunks
         self._content = None
-        self._z_content = None
+        self._z_content_chunks = None
 
     def set_content(self, content):
         """Set the content of this block."""
         self._content_length = len(content)
         self._content = content
-        self._z_content = None
+        self._z_content_chunks = None
 
@@ -280 +301 @@
     def _create_z_content_using_lzma(self):
         if self._content_chunks is not None:
             self._content_chunks = None
         if self._content is None:
             raise AssertionError('Nothing to compress')
-        self._z_content = pylzma.compress(self._content)
-        self._z_content_length = len(self._z_content)
+        z_content = pylzma.compress(self._content)
+        self._z_content_chunks = (z_content,)
+        self._z_content_length = len(z_content)
 
@@ -289 +311 @@
-    def _create_z_content_from_chunks(self):
+    def _create_z_content_from_chunks(self, chunks):
         compressor = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)
-        compressed_chunks = map(compressor.compress, self._content_chunks)
+        # Peak at this point is 1 fulltext, 1 compressed text, + zlib overhead
+        # (measured peak is maybe 30MB over the above...)
+        compressed_chunks = map(compressor.compress, chunks)
         compressed_chunks.append(compressor.flush())
-        self._z_content = ''.join(compressed_chunks)
-        self._z_content_length = len(self._z_content)
+        # Ignore empty chunks
+        self._z_content_chunks = [c for c in compressed_chunks if c]
+        self._z_content_length = sum(map(len, self._z_content_chunks))
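The pattern introduced in _create_z_content_from_chunks() above is plain incremental zlib compression. As a standalone sketch (ordinary Python, not bzrlib code; compress_chunks is a hypothetical helper name):

    import zlib

    def compress_chunks(chunks):
        # Feed each chunk to one compressobj, flush once at the end, and drop
        # the empty strings compress() returns while it is still buffering.
        compressor = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)
        compressed = map(compressor.compress, chunks)
        compressed.append(compressor.flush())
        compressed = [c for c in compressed if c]
        return sum(map(len, compressed)), compressed

    z_len, z_chunks = compress_chunks(['a chunk of text\n'] * 500)
    assert zlib.decompress(''.join(z_chunks)) == 'a chunk of text\n' * 500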
@@ -296 +321 @@
     def _create_z_content(self):
-        if self._z_content is not None:
+        if self._z_content_chunks is not None:
             self._create_z_content_using_lzma()
         if self._content_chunks is not None:
-            self._create_z_content_from_chunks()
-        self._z_content = zlib.compress(self._content)
-        self._z_content_length = len(self._z_content)
+            chunks = self._content_chunks
+            chunks = (self._content,)
+        self._create_z_content_from_chunks(chunks)
@@ -309 +334 @@
-        """Encode the information into a byte stream."""
+        """Create the byte stream as a series of 'chunks'"""
         self._create_z_content()
             header = self.GCB_LZ_HEADER
             header = self.GCB_HEADER
-                  '%d\n%d\n' % (self._z_content_length, self._content_length),
+        chunks = ['%s%d\n%d\n'
+                  % (header, self._z_content_length, self._content_length),
+        chunks.extend(self._z_content_chunks)
+        total_len = sum(map(len, chunks))
+        return total_len, chunks
+
+    def to_bytes(self):
+        """Encode the information into a byte stream."""
+        total_len, chunks = self.to_chunks()
         return ''.join(chunks)
 
     def _dump(self, include_text=False):
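With the hunk above, to_bytes() is reduced to a wrapper that joins whatever to_chunks() produces. A minimal usage sketch, assuming a GroupCompressBlock can be built directly (as the test suite does) and that only the zlib path is exercised:

    from cStringIO import StringIO

    from bzrlib.groupcompress import GroupCompressBlock

    block = GroupCompressBlock()
    block.set_content('some text worth storing\n' * 1000)

    # Stream the serialised block chunk by chunk instead of materialising
    # one large string up front.
    out = StringIO()
    total_len, chunks = block.to_chunks()
    for chunk in chunks:
        out.write(chunk)

    # to_bytes() is now just ''.join() over the same chunks.
    assert out.getvalue() == block.to_bytes()
    assert total_len == len(out.getvalue())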
@@ -460 +491 @@
     _full_enough_block_size = 3*1024*1024 # size at which we won't repack
     _full_enough_mixed_block_size = 2*768*1024 # 1.5MB
 
-    def __init__(self, block):
+    def __init__(self, block, get_compressor_settings=None):
         self._block = block
         # We need to preserve the ordering
         self._factories = []
         self._last_byte = 0
+        self._get_settings = get_compressor_settings
+        self._compressor_settings = None
+
+    def _get_compressor_settings(self):
+        if self._compressor_settings is not None:
+            return self._compressor_settings
+        if self._get_settings is not None:
+            settings = self._get_settings()
+            vf = GroupCompressVersionedFiles
+            settings = vf._DEFAULT_COMPRESSOR_SETTINGS
+        self._compressor_settings = settings
+        return self._compressor_settings
 
     def add_factory(self, key, parents, start, end):
         if not self._factories:
@@ -503 +548 @@
         new_block.set_content(self._block._content[:last_byte])
         self._block = new_block
+
+    def _make_group_compressor(self):
+        return GroupCompressor(self._get_compressor_settings())
 
     def _rebuild_block(self):
         """Create a new GroupCompressBlock with only the referenced texts."""
-        compressor = GroupCompressor()
+        compressor = self._make_group_compressor()
         tstart = time.time()
         old_length = self._block._content_length
 
@@ -523 +571 @@
         # block? It seems hard to come up with a method that it would
         # expand, since we do full compression again. Perhaps based on a
         # request that ends up poorly ordered?
+        # TODO: If the content would have expanded, then we would want to
+        # handle a case where we need to split the block.
+        # Now that we have a user-tweakable option
+        # (max_bytes_to_index), it is possible that one person set it
+        # to a very low value, causing poor compression.
         delta = time.time() - tstart
         self._block = new_block
         trace.mutter('creating new compressed block on-the-fly in %.3fs'
@@ -679 +732 @@
         z_header_bytes = zlib.compress(header_bytes)
         z_header_bytes_len = len(z_header_bytes)
-        block_bytes = self._block.to_bytes()
+        block_bytes_len, block_chunks = self._block.to_chunks()
         lines.append('%d\n%d\n%d\n' % (z_header_bytes_len, header_bytes_len,
         lines.append(z_header_bytes)
-        lines.append(block_bytes)
-        del z_header_bytes, block_bytes
+        lines.extend(block_chunks)
+        del z_header_bytes, block_chunks
+        # TODO: This is a point where we will double the memory consumption. To
+        # avoid this, we probably have to switch to a 'chunked' api
         return ''.join(lines)
 
@@ -691 +746 @@
     def from_bytes(cls, bytes):
         # TODO: This does extra string copying, probably better to do it a
+        # different way. At a minimum this creates 2 copies of the
         (storage_kind, z_header_len, header_len,
          block_len, rest) = bytes.split('\n', 4)
@@ -855 +911 @@
         After calling this, the compressor should no longer be used
-        # TODO: this causes us to 'bloat' to 2x the size of content in the
-        # group. This has an impact for 'commit' of large objects.
-        # One possibility is to use self._content_chunks, and be lazy and
-        # only fill out self._content as a full string when we actually
-        # need it. That would at least drop the peak memory consumption
-        # for 'commit' down to ~1x the size of the largest file, at a
-        # cost of increased complexity within this code. 2x is still <<
-        # 3x the size of the largest file, so we are doing ok.
         self._block.set_chunked_content(self.chunks, self.endpoint)
         self.chunks = None
         self._delta_index = None
@@ -948 +995 @@
+    def __init__(self, settings=None):
         super(PyrexGroupCompressor, self).__init__()
-        self._delta_index = DeltaIndex()
+            max_bytes_to_index = \
+                GroupCompressVersionedFiles._DEFAULT_MAX_BYTES_TO_INDEX
+            (max_bytes_to_index,) = settings
+        self._delta_index = DeltaIndex(max_bytes_to_index=max_bytes_to_index)
 
     def _compress(self, key, bytes, max_delta_size, soft=False):
         """see _CommonGroupCompressor._compress"""
@@ -1027 +1080 @@
         index = _GCGraphIndex(graph_index, lambda:True, parents=parents,
             add_callback=graph_index.add_nodes,
             inconsistency_fatal=inconsistency_fatal)
-        access = knit._DirectPackAccess({})
+        access = pack_repo._DirectPackAccess({})
         access.set_writer(writer, graph_index, (transport, 'newpack'))
         result = GroupCompressVersionedFiles(index, access, delta)
         result.stream = stream
@@ -1044 +1097 @@
 class _BatchingBlockFetcher(object):
     """Fetch group compress blocks in batches.
 
     :ivar total_bytes: int of expected number of bytes needed to fetch the
         currently pending batch.
 
-    def __init__(self, gcvf, locations):
+    def __init__(self, gcvf, locations, get_compressor_settings=None):
         self.gcvf = gcvf
         self.locations = locations
 
@@ -1102 +1156 @@
     def yield_factories(self, full_flush=False):
         """Yield factories for keys added since the last yield. They will be
         returned in the order they were added via add_key.
 
         :param full_flush: by default, some results may not be returned in case
             they can be part of the next batch. If full_flush is True, then
             all results are returned.
 
@@ -1136 +1190 @@
                     memos_to_get_stack.pop()
                     block = self.batch_memos[read_memo]
-                self.manager = _LazyGroupContentManager(block)
+                self.manager = _LazyGroupContentManager(block,
+                    get_compressor_settings=self._get_compressor_settings)
                 self.last_read_memo = read_memo
             start, end = index_memo[3:5]
             self.manager.add_factory(key, parents, start, end)
         self.total_bytes = 0
@@ -1152 +1207 @@
-class GroupCompressVersionedFiles(VersionedFiles):
+class GroupCompressVersionedFiles(VersionedFilesWithFallbacks):
     """A group-compress based VersionedFiles implementation."""
 
-    def __init__(self, index, access, delta=True, _unadded_refs=None):
+    # This controls how the GroupCompress DeltaIndex works. Basically, we
+    # compute hash pointers into the source blocks (so hash(text) => text).
+    # However each of these references costs some memory in trade against a
+    # more accurate match result. For very large files, they either are
+    # pre-compressed and change in bulk whenever they change, or change in just
+    # local blocks. Either way, 'improved resolution' is not very helpful,
+    # versus running out of memory trying to track everything. The default max
+    # gives 100% sampling of a 1MB file.
+    _DEFAULT_MAX_BYTES_TO_INDEX = 1024 * 1024
+    _DEFAULT_COMPRESSOR_SETTINGS = (_DEFAULT_MAX_BYTES_TO_INDEX,)
+
+    def __init__(self, index, access, delta=True, _unadded_refs=None,
         """Create a GroupCompressVersionedFiles object.
 
         :param index: The index object storing access and graph data.
         :param access: The access object storing raw data.
         :param delta: Whether to delta compress or just entropy compress.
         :param _unadded_refs: private parameter, don't use.
+        :param _group_cache: private parameter, don't use.
         """
         self._index = index
         self._access = access
         if _unadded_refs is None:
             _unadded_refs = {}
         self._unadded_refs = _unadded_refs
-        self._group_cache = LRUSizeCache(max_size=50*1024*1024)
-        self._fallback_vfs = []
+        if _group_cache is None:
+            _group_cache = LRUSizeCache(max_size=50*1024*1024)
+        self._group_cache = _group_cache
+        self._immediate_fallback_vfs = []
+        self._max_bytes_to_index = None
 
     def without_fallbacks(self):
         """Return a clone of this object without any fallbacks configured."""
         return GroupCompressVersionedFiles(self._index, self._access,
-            self._delta, _unadded_refs=dict(self._unadded_refs))
+            self._delta, _unadded_refs=dict(self._unadded_refs),
+            _group_cache=self._group_cache)
 
     def add_lines(self, key, parents, lines, parent_texts=None,
                   left_matching_blocks=None, nostore_sha=None, random_id=False,
@@ -1293 +1365 @@
         # KnitVersionedFiles.get_known_graph_ancestry, but they don't share
         parent_map, missing_keys = self._index.find_ancestry(keys)
-        for fallback in self._fallback_vfs:
+        for fallback in self._transitive_fallbacks():
             if not missing_keys:
             (f_parent_map, f_missing_keys) = fallback._index.find_ancestry(
 
@@ -1451 +1523 @@
             the defined order, regardless of source.
         if ordering == 'topological':
-            present_keys = topo_sort(parent_map)
+            present_keys = tsort.topo_sort(parent_map)
             # ordering == 'groupcompress'
             # XXX: This only optimizes for the target ordering. We may need
 
@@ -1546 +1618 @@
         # - we encounter an unadded ref, or
         # - we run out of keys, or
         # - the total bytes to retrieve for this batch > BATCH_SIZE
-        batcher = _BatchingBlockFetcher(self, locations)
+        batcher = _BatchingBlockFetcher(self, locations,
+            get_compressor_settings=self._get_compressor_settings)
         for source, keys in source_keys:
             if source is self:
                 for key in keys:
@@ -1598 +1671 @@
         for _ in self._insert_record_stream(stream, random_id=False):
 
+    def _get_compressor_settings(self):
+        if self._max_bytes_to_index is None:
+            # TODO: VersionedFiles don't know about their containing
+            # repository, so they don't have much of an idea about their
+            # location. So for now, this is only a global option.
+            c = config.GlobalConfig()
+            val = c.get_user_option('bzr.groupcompress.max_bytes_to_index')
+                except ValueError, e:
+                    trace.warning('Value for '
+                                  '"bzr.groupcompress.max_bytes_to_index"'
+                                  ' %r is not an integer'
+                val = self._DEFAULT_MAX_BYTES_TO_INDEX
+            self._max_bytes_to_index = val
+        return (self._max_bytes_to_index,)
+
+    def _make_group_compressor(self):
+        return GroupCompressor(self._get_compressor_settings())
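The new setting is deliberately coarse: _get_compressor_settings() consults a single global option, and a non-integer value falls back to the 1MB default with a warning. A hedged sketch of setting and reading that option through the config API (assuming GlobalConfig.set_user_option is available here, as it is for other global options):

    from bzrlib import config

    c = config.GlobalConfig()
    # Store the value as a string; _get_compressor_settings() parses it with
    # int() and ignores values that do not parse.
    c.set_user_option('bzr.groupcompress.max_bytes_to_index',
                      '%d' % (4 * 1024 * 1024))
    print c.get_user_option('bzr.groupcompress.max_bytes_to_index')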
@@ -1601 +1698 @@
     def _insert_record_stream(self, stream, random_id=False, nostore_sha=None,
                               reuse_blocks=True):
         """Internal core to insert a record stream into this container.
 
@@ -1627 +1724 @@
         # This will go up to fulltexts for gc to gc fetching, which isn't
-        self._compressor = GroupCompressor()
+        self._compressor = self._make_group_compressor()
         self._unadded_refs = {}
         keys_to_add = []
-            bytes = self._compressor.flush().to_bytes()
-            self._compressor = GroupCompressor()
+            bytes_len, chunks = self._compressor.flush().to_chunks()
+            self._compressor = self._make_group_compressor()
+            # Note: At this point we still have 1 copy of the fulltext (in
+            # record and the var 'bytes'), and this generates 2 copies of
+            # the compressed text (one for bytes, one in chunks)
+            # TODO: Push 'chunks' down into the _access api, so that we don't
+            # have to double compressed memory here
+            # TODO: Figure out how to indicate that we would be happy to free
+            # the fulltext content at this point. Note that sometimes we
+            # will want it later (streaming CHK pages), but most of the
+            # time we won't (everything else)
+            bytes = ''.join(chunks)
             index, start, length = self._access.add_raw_records(
                 [(None, len(bytes))], bytes)[0]
@@ -1802 +1910 @@
         """See VersionedFiles.keys."""
         if 'evil' in debug.debug_flags:
             trace.mutter_callsite(2, "keys scales with size of history")
-        sources = [self._index] + self._fallback_vfs
+        sources = [self._index] + self._immediate_fallback_vfs
         for source in sources:
             result.update(source.keys())
@@ +1920 @@
+class _GCBuildDetails(object):
+    """A blob of data about the build details.
+
+    This stores the minimal data, which then allows compatibility with the old
+    api, without taking as much memory.
+    """
+
+    __slots__ = ('_index', '_group_start', '_group_end', '_basis_end',
+                 '_delta_end', '_parents')
+
+    compression_parent = None
+
+    def __init__(self, parents, position_info):
+        self._parents = parents
+        (self._index, self._group_start, self._group_end, self._basis_end,
+         self._delta_end) = position_info
+
+    def __repr__(self):
+        return '%s(%s, %s)' % (self.__class__.__name__,
+            self.index_memo, self._parents)
+
+    def index_memo(self):
+        return (self._index, self._group_start, self._group_end,
+                self._basis_end, self._delta_end)
+
+    def record_details(self):
+        return static_tuple.StaticTuple(self.method, None)
+
+    def __getitem__(self, offset):
+        """Compatibility thunk to act like a tuple."""
+        if offset == 0:
+            return self.index_memo
+        elif offset == 1:
+            return self.compression_parent # Always None
+        elif offset == 2:
+            return self._parents
+        elif offset == 3:
+            return self.record_details
+        else:
+            raise IndexError('offset out of range')
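Assuming the branches above follow the conventional (index_memo, compression_parent, parents, record_details) layout, tuple-style access behaves as in this sketch; the index object, key, and offsets are made-up values:

    from bzrlib.groupcompress import _GCBuildDetails

    details = _GCBuildDetails(parents=(('parent-key',),),
                              position_info=('index-obj', 0, 4096, 128, 4000))

    assert details[0] == details.index_memo   # (index, group_start, group_end, basis_end, delta_end)
    assert details[1] is None                 # compression_parent is always None for groupcompress
    assert details[2] == (('parent-key',),)   # parents
    assert details[3] == details.record_details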
@@ -1812 +1968 @@
 class _GCGraphIndex(object):
     """Mapper from GroupCompressVersionedFiles needs into GraphIndex storage."""
 
@@ -1843 +1999 @@
         # repeated over and over, this creates a surplus of ints
         self._int_cache = {}
         if track_external_parent_refs:
-            self._key_dependencies = knit._KeyRefs(
+            self._key_dependencies = _KeyRefs(
                 track_new_keys=track_new_keys)
             self._key_dependencies = None
 
@@ -2033 +2188 @@
         # each, or about 7MB. Note that it might be even more when you consider
         # how PyInt is allocated in separate slabs. And you can't return a slab
         # to the OS if even 1 int on it is in use. Note though that Python uses
-        # a LIFO when re-using PyInt slots, which probably causes more
+        # a LIFO when re-using PyInt slots, which might cause more
         # fragmentation.
         start = int(bits[0])
         start = self._int_cache.setdefault(start, start)
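The _int_cache trick above is plain interning via dict.setdefault; a standalone illustration of why it saves memory when the same offsets repeat across many index rows:

    # Not bzrlib code: a minimal sketch of the interning pattern.
    _int_cache = {}

    def intern_offset(value):
        # setdefault returns the already-cached object when the value has been
        # seen before, so repeated offsets all share a single int object.
        return _int_cache.setdefault(value, value)

    a = intern_offset(123456)
    b = intern_offset(123456)
    assert a is b   # same object, not merely an equal one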