 except ImportError:
+from bzrlib.lazy_import import lazy_import
+lazy_import(globals(), """
 from bzrlib import (
     graph as _mod_graph,
+from bzrlib.repofmt import pack_repo
 from bzrlib.btree_index import BTreeBuilder
 from bzrlib.lru_cache import LRUSizeCache
-from bzrlib.tsort import topo_sort
 from bzrlib.versionedfile import (
     AbsentContentFactory,
     ChunkedContentFactory,
     FulltextContentFactory,
+    VersionedFilesWithFallbacks,
 # Minimum number of uncompressed bytes to try fetch at once when retrieving
             self._content = ''.join(self._content_chunks)
             self._content_chunks = None
         if self._content is None:
-            if self._z_content is None:
+            # We join self._z_content_chunks here, because if we are
+            # decompressing, then it is *very* likely that we have a single
+            if self._z_content_chunks is None:
                 raise AssertionError('No content to decompress')
-            if self._z_content == '':
+            z_content = ''.join(self._z_content_chunks)
                 self._content = ''
             elif self._compressor_name == 'lzma':
                 # We don't do partial lzma decomp yet
-                self._content = pylzma.decompress(self._z_content)
+                self._content = pylzma.decompress(z_content)
             elif self._compressor_name == 'zlib':
                 # Start a zlib decompressor
                 if num_bytes * 4 > self._content_length * 3:
                     # If we are requesting more that 3/4ths of the content,
                     # just extract the whole thing in a single pass
                     num_bytes = self._content_length
-                    self._content = zlib.decompress(self._z_content)
+                    self._content = zlib.decompress(z_content)
                     self._z_content_decompressor = zlib.decompressobj()
                     # Seed the decompressor with the uncompressed bytes, so
                     # that the rest of the code is simplified
                     self._content = self._z_content_decompressor.decompress(
-                        self._z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
+                        z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
                     if not self._z_content_decompressor.unconsumed_tail:
                         self._z_content_decompressor = None
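# Illustrative sketch (an aside, with made-up names and data): the partial
# extraction above relies on zlib.decompressobj() accepting a max_length
# argument and exposing unconsumed_tail so decompression can resume later.
import zlib
_z = zlib.compress('x' * 200000)
_d = zlib.decompressobj()
_prefix = _d.decompress(_z, 4096)          # at most 4096 bytes are returned
assert len(_prefix) <= 4096
if _d.unconsumed_tail:                     # compressed input still pending
    _rest = _d.decompress(_d.unconsumed_tail)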
             # XXX: Define some GCCorrupt error ?
             raise AssertionError('Invalid bytes: (%d) != %d + %d' %
                 (len(bytes), pos, self._z_content_length))
-        self._z_content = bytes[pos:]
+        self._z_content_chunks = (bytes[pos:],)

+    def _z_content(self):
+        """Return z_content_chunks as a simple string.
+        Meant only to be used by the test suite.
+        if self._z_content_chunks is not None:
+            return ''.join(self._z_content_chunks)

     def from_bytes(cls, bytes):
         self._content_length = length
         self._content_chunks = content_chunks
         self._content = None
-        self._z_content = None
+        self._z_content_chunks = None

     def set_content(self, content):
         """Set the content of this block."""
         self._content_length = len(content)
         self._content = content
-        self._z_content = None
+        self._z_content_chunks = None

     def _create_z_content_using_lzma(self):
         if self._content_chunks is not None:
             self._content_chunks = None
         if self._content is None:
             raise AssertionError('Nothing to compress')
-        self._z_content = pylzma.compress(self._content)
-        self._z_content_length = len(self._z_content)
+        z_content = pylzma.compress(self._content)
+        self._z_content_chunks = (z_content,)
+        self._z_content_length = len(z_content)
-    def _create_z_content_from_chunks(self):
+    def _create_z_content_from_chunks(self, chunks):
         compressor = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)
-        compressed_chunks = map(compressor.compress, self._content_chunks)
+        # Peak in this point is 1 fulltext, 1 compressed text, + zlib overhead
+        # (measured peak is maybe 30MB over the above...)
+        compressed_chunks = map(compressor.compress, chunks)
         compressed_chunks.append(compressor.flush())
-        self._z_content = ''.join(compressed_chunks)
-        self._z_content_length = len(self._z_content)
+        # Ignore empty chunks
+        self._z_content_chunks = [c for c in compressed_chunks if c]
+        self._z_content_length = sum(map(len, self._z_content_chunks))

     def _create_z_content(self):
-        if self._z_content is not None:
+        if self._z_content_chunks is not None:
             self._create_z_content_using_lzma()
         if self._content_chunks is not None:
-            self._create_z_content_from_chunks()
-            self._z_content = zlib.compress(self._content)
-            self._z_content_length = len(self._z_content)
+            chunks = self._content_chunks
+            chunks = (self._content,)
+        self._create_z_content_from_chunks(chunks)
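# Illustrative sketch (an aside, names are hypothetical): compressing a list
# of chunks without joining them first, as _create_z_content_from_chunks now
# does, still yields a single valid zlib stream when the outputs are joined.
import zlib
_chunks = ['first chunk\n', '', 'second chunk\n']   # note the empty chunk
_c = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)
_z_chunks = [_c.compress(chunk) for chunk in _chunks]
_z_chunks.append(_c.flush())
_z_chunks = [z for z in _z_chunks if z]             # drop empty outputs
_total_len = sum(map(len, _z_chunks))
assert zlib.decompress(''.join(_z_chunks)) == ''.join(_chunks)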
-        """Encode the information into a byte stream."""
+        """Create the byte stream as a series of 'chunks'"""
         self._create_z_content()
             header = self.GCB_LZ_HEADER
             header = self.GCB_HEADER
-                  '%d\n%d\n' % (self._z_content_length, self._content_length),
+        chunks = ['%s%d\n%d\n'
+                  % (header, self._z_content_length, self._content_length),
+        chunks.extend(self._z_content_chunks)
+        total_len = sum(map(len, chunks))
+        return total_len, chunks

+        """Encode the information into a byte stream."""
+        total_len, chunks = self.to_chunks()
         return ''.join(chunks)
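# Illustrative sketch (an aside; write_block and out_file are made-up names):
# a caller that can write incrementally can consume to_chunks() directly and
# never pay for the single large string that to_bytes() builds.
def write_block(block, out_file):
    total_len, chunks = block.to_chunks()
    for chunk in chunks:
        out_file.write(chunk)
    return total_len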
     def _dump(self, include_text=False):
     _full_enough_block_size = 3*1024*1024 # size at which we won't repack
     _full_enough_mixed_block_size = 2*768*1024 # 1.5MB

-    def __init__(self, block):
+    def __init__(self, block, get_compressor_settings=None):
         self._block = block
         # We need to preserve the ordering
         self._factories = []
         self._last_byte = 0
+        self._get_settings = get_compressor_settings
+        self._compressor_settings = None

+    def _get_compressor_settings(self):
+        if self._compressor_settings is not None:
+            return self._compressor_settings
+        if self._get_settings is not None:
+            settings = self._get_settings()
+            vf = GroupCompressVersionedFiles
+            settings = vf._DEFAULT_COMPRESSOR_SETTINGS
+        self._compressor_settings = settings
+        return self._compressor_settings

     def add_factory(self, key, parents, start, end):
         if not self._factories:

         new_block.set_content(self._block._content[:last_byte])
         self._block = new_block

+    def _make_group_compressor(self):
+        return GroupCompressor(self._get_compressor_settings())
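# Illustrative sketch (an aside, values are made up): the new
# get_compressor_settings callback lets the manager pull settings lazily from
# its creator instead of hard-coding GroupCompressor defaults.
def _example_settings():
    return {'max_bytes_to_index': 1024 * 1024}

_manager = _LazyGroupContentManager(GroupCompressBlock(),
    get_compressor_settings=_example_settings)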
     def _rebuild_block(self):
         """Create a new GroupCompressBlock with only the referenced texts."""
-        compressor = GroupCompressor()
+        compressor = self._make_group_compressor()
         tstart = time.time()
         old_length = self._block._content_length

         # block? It seems hard to come up with a method that it would
         # expand, since we do full compression again. Perhaps based on a
         # request that ends up poorly ordered?
+        # TODO: If the content would have expanded, then we would want to
+        # handle a case where we need to split the block.
+        # Now that we have a user-tweakable option
+        # (max_bytes_to_index), it is possible that one person set it
+        # to a very low value, causing poor compression.
         delta = time.time() - tstart
         self._block = new_block
         trace.mutter('creating new compressed block on-the-fly in %.3fs'
         z_header_bytes = zlib.compress(header_bytes)
         z_header_bytes_len = len(z_header_bytes)
-        block_bytes = self._block.to_bytes()
+        block_bytes_len, block_chunks = self._block.to_chunks()
         lines.append('%d\n%d\n%d\n' % (z_header_bytes_len, header_bytes_len,
         lines.append(z_header_bytes)
-        lines.append(block_bytes)
-        del z_header_bytes, block_bytes
+        lines.extend(block_chunks)
+        del z_header_bytes, block_chunks
+        # TODO: This is a point where we will double the memory consumption. To
+        # avoid this, we probably have to switch to a 'chunked' api
         return ''.join(lines)

     def from_bytes(cls, bytes):
         # TODO: This does extra string copying, probably better to do it a
+        # different way. At a minimum this creates 2 copies of the
         (storage_kind, z_header_len, header_len,
          block_len, rest) = bytes.split('\n', 4)
         self.labels_deltas = {}
         self._delta_index = None # Set by the children
         self._block = GroupCompressBlock()
+        self._settings = settings

     def compress(self, key, bytes, expected_sha, nostore_sha=None, soft=False):
         """Compress lines with label key.
         After calling this, the compressor should no longer be used
-        # TODO: this causes us to 'bloat' to 2x the size of content in the
-        # group. This has an impact for 'commit' of large objects.
-        # One possibility is to use self._content_chunks, and be lazy and
-        # only fill out self._content as a full string when we actually
-        # need it. That would at least drop the peak memory consumption
-        # for 'commit' down to ~1x the size of the largest file, at a
-        # cost of increased complexity within this code. 2x is still <<
-        # 3x the size of the largest file, so we are doing ok.
         self._block.set_chunked_content(self.chunks, self.endpoint)
         self.chunks = None
         self._delta_index = None
 class PythonGroupCompressor(_CommonGroupCompressor):

+    def __init__(self, settings=None):
         """Create a GroupCompressor.

         Used only if the pyrex version is not available.
-        super(PythonGroupCompressor, self).__init__()
+        super(PythonGroupCompressor, self).__init__(settings)
         self._delta_index = LinesDeltaIndex([])
         # The actual content is managed by LinesDeltaIndex
         self.chunks = self._delta_index.lines

-        super(PyrexGroupCompressor, self).__init__()
-        self._delta_index = DeltaIndex()
+    def __init__(self, settings=None):
+        super(PyrexGroupCompressor, self).__init__(settings)
+        max_bytes_to_index = self._settings.get('max_bytes_to_index', 0)
+        self._delta_index = DeltaIndex(max_bytes_to_index=max_bytes_to_index)

     def _compress(self, key, bytes, max_delta_size, soft=False):
         """see _CommonGroupCompressor._compress"""
         index = _GCGraphIndex(graph_index, lambda:True, parents=parents,
             add_callback=graph_index.add_nodes,
             inconsistency_fatal=inconsistency_fatal)
-        access = knit._DirectPackAccess({})
+        access = pack_repo._DirectPackAccess({})
         access.set_writer(writer, graph_index, (transport, 'newpack'))
         result = GroupCompressVersionedFiles(index, access, delta)
         result.stream = stream
 class _BatchingBlockFetcher(object):
     """Fetch group compress blocks in batches.

     :ivar total_bytes: int of expected number of bytes needed to fetch the
         currently pending batch.

-    def __init__(self, gcvf, locations):
+    def __init__(self, gcvf, locations, get_compressor_settings=None):
         self.gcvf = gcvf
         self.locations = locations

     def yield_factories(self, full_flush=False):
         """Yield factories for keys added since the last yield. They will be
         returned in the order they were added via add_key.

         :param full_flush: by default, some results may not be returned in case
             they can be part of the next batch. If full_flush is True, then
             all results are returned.

                     memos_to_get_stack.pop()
                 block = self.batch_memos[read_memo]
-                self.manager = _LazyGroupContentManager(block)
+                self.manager = _LazyGroupContentManager(block,
+                    get_compressor_settings=self._get_compressor_settings)
                 self.last_read_memo = read_memo
             start, end = index_memo[3:5]
             self.manager.add_factory(key, parents, start, end)

         self.total_bytes = 0
-class GroupCompressVersionedFiles(VersionedFiles):
+class GroupCompressVersionedFiles(VersionedFilesWithFallbacks):
     """A group-compress based VersionedFiles implementation."""

-    def __init__(self, index, access, delta=True, _unadded_refs=None):
+    # This controls how the GroupCompress DeltaIndex works. Basically, we
+    # compute hash pointers into the source blocks (so hash(text) => text).
+    # However each of these references costs some memory in trade against a
+    # more accurate match result. For very large files, they either are
+    # pre-compressed and change in bulk whenever they change, or change in just
+    # local blocks. Either way, 'improved resolution' is not very helpful,
+    # versus running out of memory trying to track everything. The default max
+    # gives 100% sampling of a 1MB file.
+    _DEFAULT_MAX_BYTES_TO_INDEX = 1024 * 1024
+    _DEFAULT_COMPRESSOR_SETTINGS = {'max_bytes_to_index':
+                                        _DEFAULT_MAX_BYTES_TO_INDEX}

+    def __init__(self, index, access, delta=True, _unadded_refs=None,
         """Create a GroupCompressVersionedFiles object.

         :param index: The index object storing access and graph data.
         :param access: The access object storing raw data.
         :param delta: Whether to delta compress or just entropy compress.
         :param _unadded_refs: private parameter, don't use.
+        :param _group_cache: private parameter, don't use.
         self._index = index
         self._access = access
         if _unadded_refs is None:
             _unadded_refs = {}
         self._unadded_refs = _unadded_refs
-        self._group_cache = LRUSizeCache(max_size=50*1024*1024)
-        self._fallback_vfs = []
+        if _group_cache is None:
+            _group_cache = LRUSizeCache(max_size=50*1024*1024)
+        self._group_cache = _group_cache
+        self._immediate_fallback_vfs = []
+        self._max_bytes_to_index = None

     def without_fallbacks(self):
         """Return a clone of this object without any fallbacks configured."""
         return GroupCompressVersionedFiles(self._index, self._access,
-            self._delta, _unadded_refs=dict(self._unadded_refs))
+            self._delta, _unadded_refs=dict(self._unadded_refs),
+            _group_cache=self._group_cache)
     def add_lines(self, key, parents, lines, parent_texts=None,
                   left_matching_blocks=None, nostore_sha=None, random_id=False,

         self._check_lines_not_unicode(lines)
         self._check_lines_are_lines(lines)
-    def get_known_graph_ancestry(self, keys):
-        """Get a KnownGraph instance with the ancestry of keys."""
-        # Note that this is identical to
-        # KnitVersionedFiles.get_known_graph_ancestry, but they don't share
-        parent_map, missing_keys = self._index.find_ancestry(keys)
-        for fallback in self._fallback_vfs:
-            if not missing_keys:
-            (f_parent_map, f_missing_keys) = fallback._index.find_ancestry(
-            parent_map.update(f_parent_map)
-            missing_keys = f_missing_keys
-        kg = _mod_graph.KnownGraph(parent_map)

     def get_parent_map(self, keys):
         """Get a map of the graph parents of keys.
             the defined order, regardless of source.
         if ordering == 'topological':
-            present_keys = topo_sort(parent_map)
+            present_keys = tsort.topo_sort(parent_map)
             # ordering == 'groupcompress'
             # XXX: This only optimizes for the target ordering. We may need
         # - we encounter an unadded ref, or
         # - we run out of keys, or
         # - the total bytes to retrieve for this batch > BATCH_SIZE
-        batcher = _BatchingBlockFetcher(self, locations)
+        batcher = _BatchingBlockFetcher(self, locations,
+            get_compressor_settings=self._get_compressor_settings)
         for source, keys in source_keys:
             if source is self:
                 for key in keys:

         for _ in self._insert_record_stream(stream, random_id=False):
+    def _get_compressor_settings(self):
+        if self._max_bytes_to_index is None:
+            # TODO: VersionedFiles don't know about their containing
+            # repository, so they don't have much of an idea about their
+            # location. So for now, this is only a global option.
+            c = config.GlobalConfig()
+            val = c.get_user_option('bzr.groupcompress.max_bytes_to_index')
+                except ValueError, e:
+                    trace.warning('Value for '
+                                  '"bzr.groupcompress.max_bytes_to_index"'
+                                  ' %r is not an integer'
+                val = self._DEFAULT_MAX_BYTES_TO_INDEX
+            self._max_bytes_to_index = val
+        return {'max_bytes_to_index': self._max_bytes_to_index}

+    def _make_group_compressor(self):
+        return GroupCompressor(self._get_compressor_settings())
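# Illustrative aside (assumption: GlobalConfig corresponds to the [DEFAULT]
# section of the user's bazaar.conf): a user could raise the sampling limit
# with an entry such as
#
#     [DEFAULT]
#     bzr.groupcompress.max_bytes_to_index = 4194304
#
# Values that do not parse as an integer fall back to
# _DEFAULT_MAX_BYTES_TO_INDEX via the warning branch above.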
     def _insert_record_stream(self, stream, random_id=False, nostore_sha=None,
                               reuse_blocks=True):
         """Internal core to insert a record stream into this container.

         # This will go up to fulltexts for gc to gc fetching, which isn't
-        self._compressor = GroupCompressor()
+        self._compressor = self._make_group_compressor()
         self._unadded_refs = {}
         keys_to_add = []
-            bytes = self._compressor.flush().to_bytes()
-            self._compressor = GroupCompressor()
+            bytes_len, chunks = self._compressor.flush().to_chunks()
+            self._compressor = self._make_group_compressor()
+            # Note: At this point we still have 1 copy of the fulltext (in
+            # record and the var 'bytes'), and this generates 2 copies of
+            # the compressed text (one for bytes, one in chunks)
+            # TODO: Push 'chunks' down into the _access api, so that we don't
+            # have to double compressed memory here
+            # TODO: Figure out how to indicate that we would be happy to free
+            # the fulltext content at this point. Note that sometimes we
+            # will want it later (streaming CHK pages), but most of the
+            # time we won't (everything else)
+            bytes = ''.join(chunks)
             index, start, length = self._access.add_raw_records(
                 [(None, len(bytes))], bytes)[0]
         """See VersionedFiles.keys."""
         if 'evil' in debug.debug_flags:
             trace.mutter_callsite(2, "keys scales with size of history")
-        sources = [self._index] + self._fallback_vfs
+        sources = [self._index] + self._immediate_fallback_vfs
         for source in sources:
             result.update(source.keys())
+class _GCBuildDetails(object):
+    """A blob of data about the build details.

+    This stores the minimal data, which then allows compatibility with the old
+    api, without taking as much memory.

+    __slots__ = ('_index', '_group_start', '_group_end', '_basis_end',
+                 '_delta_end', '_parents')

+    compression_parent = None

+    def __init__(self, parents, position_info):
+        self._parents = parents
+        (self._index, self._group_start, self._group_end, self._basis_end,
+         self._delta_end) = position_info

+        return '%s(%s, %s)' % (self.__class__.__name__,
+            self.index_memo, self._parents)

+    def index_memo(self):
+        return (self._index, self._group_start, self._group_end,
+                self._basis_end, self._delta_end)

+    def record_details(self):
+        return static_tuple.StaticTuple(self.method, None)

+    def __getitem__(self, offset):
+        """Compatibility thunk to act like a tuple."""
+            return self.index_memo
+            return self.compression_parent # Always None
+            return self._parents
+            return self.record_details
+            raise IndexError('offset out of range')
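# Illustrative aside (the offsets are inferred from the returns above, so
# treat this mapping as an assumption): the thunk keeps old tuple-style
# access working, roughly:
#
#     details[0]  -> index_memo
#     details[1]  -> compression_parent (always None)
#     details[2]  -> parents
#     details[3]  -> record_details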
 class _GCGraphIndex(object):
     """Mapper from GroupCompressVersionedFiles needs into GraphIndex storage."""

         # repeated over and over, this creates a surplus of ints
         self._int_cache = {}
         if track_external_parent_refs:
-            self._key_dependencies = knit._KeyRefs(
+            self._key_dependencies = _KeyRefs(
                 track_new_keys=track_new_keys)
             self._key_dependencies = None
         # each, or about 7MB. Note that it might be even more when you consider
         # how PyInt is allocated in separate slabs. And you can't return a slab
         # to the OS if even 1 int on it is in use. Note though that Python uses
-        # a LIFO when re-using PyInt slots, which probably causes more
+        # a LIFO when re-using PyInt slots, which might cause more
         # fragmentation.
         start = int(bits[0])
         start = self._int_cache.setdefault(start, start)
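# Illustrative sketch (an aside, names are made up): the setdefault-based
# interning above returns the first int object stored for a given value, so
# repeated offsets share one PyInt instead of allocating a fresh one each time.
_int_cache = {}

def _intern_int(value):
    return _int_cache.setdefault(value, value)

assert _intern_int(12345) is _intern_int(12345)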