class ContainerWriter(object):
    # ... (class docstring elided) ...

    def __init__(self, write_func):
        """Constructor.

        :param write_func: a callable that will be called when this
            ContainerWriter needs to write some bytes.
        """
        self._write_func = write_func
        self.current_offset = 0
        self.records_written = 0
    def begin(self):
        """Begin writing a container."""
        self.write_func(FORMAT_ONE + "\n")

    def write_func(self, bytes):
        # Every write is funnelled through this method so that
        # current_offset always matches the number of bytes emitted;
        # add_bytes_record relies on that to compute record memos.
        self._write_func(bytes)
        self.current_offset += len(bytes)
    def end(self):
        """Finish writing a container."""
        self.write_func("E")
    def add_bytes_record(self, bytes, names):
        """Add a Bytes record with the given names.

        :param bytes: The bytes to insert.
        :param names: The names to give the inserted bytes. Each name is
            a tuple of bytestrings. The bytestrings may not contain
            whitespace.
        :return: An offset, length tuple. The offset is the offset
            of the record within the container, and the length is the
            length of data that will need to be read to reconstitute the
            record. This offset and length can only be used with the pack
            interface - they might be offset by headers or other such
            details and thus are only suitable for use by a
            ContainerReader.
        """
        current_offset = self.current_offset
        # Kind marker.
        byte_sections = ["B"]
        # Length.
        byte_sections.append(str(len(bytes)) + "\n")
        # Names.
        for name_tuple in names:
            # Make sure we're writing valid names.  Note that we will
            # leave a half-written record if a name is bad!
            for name in name_tuple:
                _check_name(name)
            byte_sections.append('\x00'.join(name_tuple) + "\n")
        # A blank line ends the headers.
        byte_sections.append("\n")
        # Finally, the contents.
        byte_sections.append(bytes)
        # XXX: This causes a memory copy of len(bytes) in size, but is
        # usually faster than two write calls (12 vs 13 seconds to output
        # a gig of 1k records).  Results may differ on significantly
        # larger records, like .isos, but those should be rare and are
        # thus unlikely to be the common case.  The biggest issue is the
        # extreme memory pressure they would cause.  One possible
        # improvement is to check the size of the content before deciding
        # between a single join-and-write and two write calls.
        self.write_func(''.join(byte_sections))
        self.records_written += 1
        # Return a memo of where we wrote data, to allow random access.
        return current_offset, self.current_offset - current_offset
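    # For illustration (not part of the module): given the layout built
    # above,
    #     writer.add_bytes_record('hello', names=[('name1', 'name2')])
    # appends these bytes to the container:
    #     'B'                   kind marker
    #     '5\n'                 decimal content length
    #     'name1\x00name2\n'    one line per name tuple, NUL-separated
    #     '\n'                  a blank line ends the headers
    #     'hello'               exactly 5 bytes of content
    # and returns (offset_of_the_kind_marker, bytes_written) as the memo.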
class ReadVFile(object):
    """Adapt a readv result iterator to a file like protocol."""

    def __init__(self, readv_result):
        self.readv_result = readv_result
        # The most recent readv result block.
        self._string = None
    def _next(self):
        # Advance to the next readv hunk once the current buffer is
        # exhausted.
        if (self._string is None or
            self._string.tell() == self._string_length):
            length, data = self.readv_result.next()
            self._string_length = len(data)
            self._string = StringIO(data)
    def read(self, length):
        self._next()
        result = self._string.read(length)
        if len(result) < length:
            raise errors.BzrError(
                'request for too much data from a readv hunk.')
        return result
    def readline(self):
        """Note that readline will not cross readv segments."""
        self._next()
        result = self._string.readline()
        if self._string.tell() == self._string_length and result[-1] != '\n':
            raise errors.BzrError('short readline in the readvfile hunk.')
        return result
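# A quick sketch with hypothetical data: the hunks come from
# transport.readv as (offset, bytes) pairs, and each hunk is buffered in
# turn.
#
#     hunks = iter([(0, 'header line\n'), (12, 'more bytes')])
#     f = ReadVFile(hunks)
#     f.readline()   # -> 'header line\n' (readline stays within one hunk)
#     f.read(10)     # -> 'more bytes' (drawn from the second hunk)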
def make_readv_reader(transport, filename, requested_records):
    """Create a ContainerReader that will read selected records only.

    :param transport: The transport the pack file is located on.
    :param filename: The filename of the pack file.
    :param requested_records: The record offset, length tuples as returned
        by add_bytes_record for the desired records.
    """
    # Always read the format header, then just the requested byte ranges.
    readv_blocks = [(0, len(FORMAT_ONE)+1)]
    readv_blocks.extend(requested_records)
    result = ContainerReader(ReadVFile(
        transport.readv(filename, readv_blocks)))
    return result
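# Sketch of selective reading (transport, file name, and process() are
# illustrative): memos returned by add_bytes_record are passed back as
# requested_records, so only the format header plus the wanted byte
# ranges are fetched from the transport.
#
#     memo_a = writer.add_bytes_record(bytes_a, names=[('rev-a',)])
#     memo_b = writer.add_bytes_record(bytes_b, names=[('rev-b',)])
#     reader = make_readv_reader(transport, 'data.pack', [memo_a, memo_b])
#     for names, read_bytes in reader.iter_records():
#         process(names, read_bytes(None))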
class BaseReader(object):

    # ... (intervening code between this class and validate elided) ...

    def validate(self):
        """Validate this container and its records."""
        all_names = set()
        for record_names, read_bytes in self.iter_records():
            # Consume the record bytes so iteration can continue.
            read_bytes(None)
            for name_tuple in record_names:
                for name in name_tuple:
                    _check_name_encoding(name)
                # Check that the name is unique.  Note that Python will
                # refuse to decode non-shortest forms of UTF-8 encoding,
                # so there is no risk that the same unicode string has
                # been encoded two different ways.
                if name_tuple in all_names:
                    raise errors.DuplicateRecordNameError(name_tuple)
                all_names.add(name_tuple)
        excess_bytes = self.reader_func(1)
        if excess_bytes != '':
            raise errors.ContainerHasExcessDataError(excess_bytes)
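# Validation consumes the stream (it drives iter_records), so a reader
# can be validated or iterated, not both. A sketch (file name
# illustrative; the reader takes a file-like object, as make_readv_reader
# above suggests):
#
#     reader = ContainerReader(open('data.pack', 'rb'))
#     reader.validate()   # raises DuplicateRecordNameError on repeated
#                         # name tuples, ContainerHasExcessDataError if
#                         # bytes follow the end marker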