/brz/remove-bazaar : revision 1755.3.4

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/transport/http/__init__.py

Committer: Robert Collins
Date: 2006-08-08 23:19:29 UTC
mfrom: (1884 +trunk)
mto: This revision was merged to the branch mainline in revision 1912.
Revision ID: robertc@robertcollins.net-20060808231929-4e3e298190214b3a

current status

files added:
bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/ignores.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/response.py

profile_imports.py

files removed:
foo bar

files renamed:
bzrlib/bundle/read_bundle.py => bzrlib/bundle/bundle_data.py

bzrlib/bundle/serializer/v07.py => bzrlib/bundle/serializer/v08.py

files modified:
.bzrignore

HACKING

Makefile

NEWS

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export/tar_exporter.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/fakenfs.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml_serializer.py

doc/README.1st

doc/configuration.txt

doc/setting_up_email.txt

doc/tutorial.txt

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http/__init__.py

There are separate implementation modules for each http client implementation.

"""

from cStringIO import StringIO

import errno

import mimetools

import os

from collections import deque

from cStringIO import StringIO

import posixpath

import re

import sys

import urlparse

import urllib

from warnings import warn

from bzrlib.transport import Transport, register_transport, Server

# TODO: load these only when running http tests

import BaseHTTPServer, SimpleHTTPServer, socket, time

import threading

from bzrlib import errors

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError, InvalidURL)

from bzrlib.branch import Branch

from bzrlib.trace import mutter

# TODO: load these only when running http tests

import BaseHTTPServer, SimpleHTTPServer, socket, time

import threading

from bzrlib.transport import Transport, register_transport, Server

from bzrlib.transport.http.response import (HttpMultipartRangeResponse,

HttpRangeResponse)

from bzrlib.ui import ui_factory

return url

def _extract_headers(header_text, url):

"""Extract the mapping for an rfc2822 header

This is a helper function for the test suite and for _pycurl.

(urllib already parses the headers for us)

In the case that there are multiple headers inside the file,

the last one is returned.

:param header_text: A string of header information.

This expects that the first line of a header will always be HTTP ...

:param url: The url we are parsing, so we can raise nice errors

:return: mimetools.Message object, which basically acts like a case

insensitive dictionary.

"""

first_header = True

remaining = header_text

if not remaining:

raise errors.InvalidHttpResponse(url, 'Empty headers')

while remaining:

100

header_file = StringIO(remaining)

101

first_line = header_file.readline()

102

if not first_line.startswith('HTTP'):

103

if first_header: # The first header *must* start with HTTP

104

raise errors.InvalidHttpResponse(url,

105

'Opening header line did not start with HTTP: %s'

106

% (first_line,))

107

assert False, 'Opening header line was not HTTP'

108

else:

109

break # We are done parsing

110

first_header = False

111

m = mimetools.Message(header_file)

112

113

# mimetools.Message parses the first header up to a blank line

114

# So while there is remaining data, it probably means there is

115

# another header to be parsed.

116

# Get rid of any preceeding whitespace, which if it is all whitespace

117

# will get rid of everything.

118

remaining = header_file.read().lstrip()

119

return m

120

121

122

class HttpTransportBase(Transport):

123

"""Base class for http implementations.

124

193

243

:param offsets: A list of (offset, size) tuples.

194

244

:param return: A list or generator of (offset, data) tuples

195

245

"""

196

# Ideally we would pass one big request asking for all the ranges in

197

# one go; however then the server will give a multipart mime response

198

# back, and we can't parse them yet. So instead we just get one range

199

# per region, and try to coallesce the regions as much as possible.

200

201

# The read-coallescing code is not quite regular enough to have a

202

# single driver routine and

203

# helper method in Transport.

204

def do_combined_read(combined_offsets):

205

# read one coalesced block

206

total_size = 0

207

for offset, size in combined_offsets:

208

total_size += size

209

mutter('readv coalesced %d reads.', len(combined_offsets))

210

offset = combined_offsets[0][0]

211

byte_range = (offset, offset + total_size - 1)

212

code, result_file = self._get(relpath, [byte_range])

213

if code == 206:

214

for off, size in combined_offsets:

215

result_bytes = result_file.read(size)

216

assert len(result_bytes) == size

217

yield off, result_bytes

218

elif code == 200:

219

data = result_file.read(offset + total_size)[offset:offset + total_size]

220

pos = 0

221

for offset, size in combined_offsets:

222

yield offset, data[pos:pos + size]

223

pos += size

224

del data

225

if not len(offsets):

226

return

227

pending_offsets = deque(offsets)

228

combined_offsets = []

229

while len(pending_offsets):

230

offset, size = pending_offsets.popleft()

231

if not combined_offsets:

232

combined_offsets = [[offset, size]]

246

ranges = self.offsets_to_ranges(offsets)

247

mutter('http readv of %s collapsed %s offsets => %s',

248

relpath, len(offsets), ranges)

249

code, f = self._get(relpath, ranges)

250

for start, size in offsets:

251

f.seek(start, (start < 0) and 2 or 0)

252

start = f.tell()

253

data = f.read(size)

254

assert len(data) == size

255

yield start, data

256

257

@staticmethod

258

def offsets_to_ranges(offsets):

259

"""Turn a list of offsets and sizes into a list of byte ranges.

260

261

:param offsets: A list of tuples of (start, size). An empty list

262

is not accepted.

263

:return: a list of inclusive byte ranges (start, end)

264

Adjacent ranges will be combined.

265

"""

266

# Make sure we process sorted offsets

267

offsets = sorted(offsets)

268

269

prev_end = None

270

combined = []

271

272

for start, size in offsets:

273

end = start + size - 1

274

if prev_end is None:

275

combined.append([start, end])

276

elif start <= prev_end + 1:

277

combined[-1][1] = end

233

278

else:

234

if (len (combined_offsets) < 500 and

235

combined_offsets[-1][0] + combined_offsets[-1][1] == offset):

236

# combatible offset:

237

combined_offsets.append([offset, size])

238

else:

239

# incompatible, or over the threshold issue a read and yield

240

pending_offsets.appendleft((offset, size))

241

for result in do_combined_read(combined_offsets):

242

yield result

243

combined_offsets = []

244

# whatever is left is a single coalesced request

245

if len(combined_offsets):

246

for result in do_combined_read(combined_offsets):

247

yield result

279

combined.append([start, end])

280

prev_end = end

281

282

return combined

248

283

249

284

def put(self, relpath, f, mode=None):

250

285

"""Copy the file-like or string object into the location.

341

376

else:

342

377

return self.__class__(self.abspath(offset))

343

378

379

@staticmethod

380

def range_header(ranges, tail_amount):

381

"""Turn a list of bytes ranges into a HTTP Range header value.

382

383

:param offsets: A list of byte ranges, (start, end). An empty list

384

is not accepted.

385

386

:return: HTTP range header string.

387

"""

388

strings = []

389

for start, end in ranges:

390

strings.append('%d-%d' % (start, end))

391

392

if tail_amount:

393

strings.append('-%d' % tail_amount)

394

395

return ','.join(strings)

396

397

344

398

#---------------- test server facilities ----------------

345

399

# TODO: load these only when running tests

346

400

398

452

method = getattr(self, mname)

399

453

method()

400

454

455

if sys.platform == 'win32':

456

# On win32 you cannot access non-ascii filenames without

457

# decoding them into unicode first.

458

# However, under Linux, you can access bytestream paths

459

# without any problems. If this function was always active

460

# it would probably break tests when LANG=C was set

461

def translate_path(self, path):

462

"""Translate a /-separated PATH to the local filename syntax.

463

464

For bzr, all url paths are considered to be utf8 paths.

465

On Linux, you can access these paths directly over the bytestream

466

request, but on win32, you must decode them, and access them

467

as Unicode files.

468

"""

469

# abandon query parameters

470

path = urlparse.urlparse(path)[2]

471

path = posixpath.normpath(urllib.unquote(path))

472

path = path.decode('utf-8')

473

words = path.split('/')

474

words = filter(None, words)

475

path = os.getcwdu()

476

for word in words:

477

drive, word = os.path.splitdrive(word)

478

head, word = os.path.split(word)

479

if word in (os.curdir, os.pardir): continue

480

path = os.path.join(path, word)

481

return path

482

401

483

402

484

class TestingHTTPServer(BaseHTTPServer.HTTPServer):

403

485

def __init__(self, server_address, RequestHandlerClass, test_case):

405

487

RequestHandlerClass)

406

488

self.test_case = test_case

407

489

490

408

491

class HttpServer(Server):

409

492

"""A test server for http transports."""

410

493

Older »