/brz/remove-bazaar : revision 2120.7.5

To get this branch, use:

bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/transport/http/_pycurl.py

Committer: Aaron Bentley
Date: 2007-03-03 17:17:53 UTC
mfrom: (2309 +trunk)
mto: This revision was merged to the branch mainline in revision 2316.
Revision ID: aaron.bentley@utoronto.ca-20070303171753-o0s1yrxx5sn12p2k

Merge bzr.dev

files added:
bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/help_topics.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/tag.py

bzrlib/tests/HttpServer.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/transport/chroot.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/wsgi.py

bzrlib/util/bencode.py

doc/bazaar-vcs.org.kid

doc/http_smart_server.txt

tools/rst2prettyhtml.py

files renamed:
bzrlib/tests/test_command.py => bzrlib/tests/test_commands.py

bzrlib/win32console.py => bzrlib/win32utils.py

files modified:
.bzrignore

BRANCH.TODO

HACKING

Makefile

NEWS

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/progress.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_config.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/smart.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/version.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/workingtree.py

bzrlib/xml5.py

bzrlib/xml6.py

doc/configuration.txt

doc/index.txt

doc/specifying_revisions.txt

doc/tutorial.txt

setup.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/start_bzr.bat

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http/_pycurl.py

import os

from cStringIO import StringIO

import sys

from bzrlib import errors

from bzrlib import (

errors,

__version__ as bzrlib_version,

)

import bzrlib

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError,

from bzrlib.errors import (NoSuchFile,

ConnectionError,

DependencyNotPresent)

from bzrlib.trace import mutter

from bzrlib.transport import register_urlparse_netloc_protocol

from bzrlib.transport.http import (HttpTransportBase, HttpServer,

_extract_headers,

response, _pycurl_errors)

from bzrlib.transport.http import (

ca_bundle,

_extract_headers,

HttpTransportBase,

_pycurl_errors,

response,

)

try:

import pycurl

PyCurl is a Python binding to the C "curl" multiprotocol client.

This transport can be significantly faster than the builtin Python client.

Advantages include: DNS caching, connection keepalive, and ability to

set headers to allow caching.

This transport can be significantly faster than the builtin

Python client. Advantages include: DNS caching.

"""

def __init__(self, base, from_transport=None):

super(PyCurlTransport, self).__init__(base)

if base.startswith('https'):

# Check availability of https into pycurl supported

# protocols

supported = pycurl.version_info()[8]

if 'https' not in supported:

raise DependencyNotPresent('pycurl', 'no https support')

self.cabundle = ca_bundle.get_ca_path()

if from_transport is not None:

self._base_curl = from_transport._base_curl

self._range_curl = from_transport._range_curl

self._curl = from_transport._curl

else:

mutter('using pycurl %s' % pycurl.version)

self._base_curl = pycurl.Curl()

self._range_curl = pycurl.Curl()

self._curl = pycurl.Curl()

def should_cache(self):

"""Return True if the data pulled across should be cached locally.

103

"""See Transport.has()"""

104

# We set NO BODY=0 in _get_full, so it should be safe

105

# to re-use the non-range curl object

curl = self._base_curl

106

curl = self._curl

107

abspath = self._real_abspath(relpath)

108

curl.setopt(pycurl.URL, abspath)

109

self._set_curl_options(curl)

111

# don't want the body - ie just do a HEAD request

100

112

# This means "NO BODY" not 'nobody'

101

113

curl.setopt(pycurl.NOBODY, 1)

114

# In some erroneous cases, pycurl will emit text on

115

# stdout if we don't catch it (see InvalidStatus tests

116

# for one such occurrence).

117

blackhole = StringIO()

118

curl.setopt(pycurl.WRITEFUNCTION, blackhole.write)

102

119

self._curl_perform(curl)

103

120

code = curl.getinfo(pycurl.HTTP_CODE)

104

121

if code == 404: # not found

107

124

return True

108

125

else:

109

126

self._raise_curl_http_error(curl)

110

127

111

128

def _get(self, relpath, ranges, tail_amount=0):

112

129

# This just switches based on the type of request

113

130

if ranges is not None or tail_amount not in (0, None):

114

131

return self._get_ranged(relpath, ranges, tail_amount=tail_amount)

115

132

else:

116

133

return self._get_full(relpath)

117

134

118

135

def _setup_get_request(self, curl, relpath):

119

136

# Make sure we do a GET request. versions > 7.14.1 also set the

120

137

# NO BODY flag, but we'll do it ourselves in case it is an older

146

163

147

164

def _get_full(self, relpath):

148

165

"""Make a request for the entire file"""

149

curl = self._base_curl

166

curl = self._curl

150

167

abspath, data, header = self._setup_get_request(curl, relpath)

151

168

self._curl_perform(curl)

152

169

156

173

if code == 404:

157

174

raise NoSuchFile(abspath)

158

175

if code != 200:

159

self._raise_curl_http_error(curl, 'expected 200 or 404 for full response.')

176

self._raise_curl_http_error(

177

curl, 'expected 200 or 404 for full response.')

160

178

161

179

return code, data

162

180

163

181

def _get_ranged(self, relpath, ranges, tail_amount):

164

182

"""Make a request for just part of the file."""

165

# We would like to re-use the same curl object for

166

# full requests and partial requests

167

# Documentation says 'Pass in NULL to disable the use of ranges'

168

# None is the closest we have, but at least with pycurl 7.13.1

169

# It raises an 'invalid arguments' response

170

# curl.setopt(pycurl.RANGE, None)

171

# curl.unsetopt(pycurl.RANGE) doesn't support the RANGE parameter

172

# So instead we hack around this by using a separate objects

173

curl = self._range_curl

183

curl = self._curl

174

184

abspath, data, header = self._setup_get_request(curl, relpath)

175

185

176

curl.setopt(pycurl.RANGE, self.range_header(ranges, tail_amount))

177

self._curl_perform(curl)

186

range_header = self.attempted_range_header(ranges, tail_amount)

187

if range_header is None:

188

# Forget ranges, the server can't handle them

189

return self._get_full(relpath)

190

191

self._curl_perform(curl, ['Range: bytes=%s'

192

% self.range_header(ranges, tail_amount)])

178

193

data.seek(0)

179

194

180

195

code = curl.getinfo(pycurl.HTTP_CODE)

185

200

186

201

def _post(self, body_bytes):

187

202

fake_file = StringIO(body_bytes)

188

curl = self._base_curl

203

curl = self._curl

189

204

# Other places that use _base_curl for GET requests explicitly set

190

205

# HTTPGET, so it should be safe to re-use the same object for both GETs

191

206

# and POSTs.

193

208

curl.setopt(pycurl.POSTFIELDSIZE, len(body_bytes))

194

209

curl.setopt(pycurl.READFUNCTION, fake_file.read)

195

210

abspath, data, header = self._setup_request(curl, '.bzr/smart')

196

self._curl_perform(curl)

211

# We override the Expect: header so that pycurl will send the POST

212

# body immediately.

213

self._curl_perform(curl,['Expect: '])

197

214

data.seek(0)

198

215

code = curl.getinfo(pycurl.HTTP_CODE)

199

216

headers = _extract_headers(header.getvalue(), abspath)

202

219

def _raise_curl_http_error(self, curl, info=None):

203

220

code = curl.getinfo(pycurl.HTTP_CODE)

204

221

url = curl.getinfo(pycurl.EFFECTIVE_URL)

205

if info is None:

206

msg = ''

222

# Some error codes can be handled the same way for all

223

# requests

224

if code == 403:

225

raise errors.TransportError(

226

'Server refuses to fullfil the request for: %s' % url)

207

227

else:

208

msg = ': ' + info

209

raise errors.InvalidHttpResponse(url, 'Unable to handle http code %d%s'

210

% (code,msg))

228

if info is None:

229

msg = ''

230

else:

231

msg = ': ' + info

232

raise errors.InvalidHttpResponse(

233

url, 'Unable to handle http code %d%s' % (code,msg))

211

234

212

235

def _set_curl_options(self, curl):

213

236

"""Set options for all requests"""

214

# There's no way in http/1.0 to say "must revalidate"; we don't want

215

# to force it to always retrieve. so just turn off the default Pragma

216

# provided by Curl.

217

# Also, we override the Expect: header so that pycurl will send the POST

218

# body immediately.

219

headers = ['Cache-control: max-age=0',

220

'Pragma: no-cache',

221

'Connection: Keep-Alive',

222

'Expect: ',]

223

237

## curl.setopt(pycurl.VERBOSE, 1)

224

238

# TODO: maybe include a summary of the pycurl version

225

239

ua_str = 'bzr/%s (pycurl)' % (bzrlib.__version__,)

226

240

curl.setopt(pycurl.USERAGENT, ua_str)

227

curl.setopt(pycurl.HTTPHEADER, headers)

228

241

curl.setopt(pycurl.FOLLOWLOCATION, 1) # follow redirect responses

242

if self.cabundle:

243

curl.setopt(pycurl.CAINFO, self.cabundle)

229

244

230

def _curl_perform(self, curl):

245

def _curl_perform(self, curl, more_headers=[]):

231

246

"""Perform curl operation and translate exceptions."""

232

247

try:

248

# There's no way in http/1.0 to say "must

249

# revalidate"; we don't want to force it to always

250

# retrieve. so just turn off the default Pragma

251

# provided by Curl.

252

headers = ['Cache-control: max-age=0',

253

'Pragma: no-cache',

254

'Connection: Keep-Alive']

255

curl.setopt(pycurl.HTTPHEADER, headers + more_headers)

233

256

curl.perform()

234

257

except pycurl.error, e:

235

# XXX: There seem to be no symbolic constants for these values.

236

258

url = curl.getinfo(pycurl.EFFECTIVE_URL)

237

259

mutter('got pycurl error: %s, %s, %s, url: %s ',

238

260

e[0], _pycurl_errors.errorcode[e[0]], e, url)

239

261

if e[0] in (_pycurl_errors.CURLE_COULDNT_RESOLVE_HOST,

240

262

_pycurl_errors.CURLE_COULDNT_CONNECT,

263

_pycurl_errors.CURLE_GOT_NOTHING,

241

264

_pycurl_errors.CURLE_COULDNT_RESOLVE_PROXY):

242

265

raise ConnectionError('curl connection error (%s)\non %s'

243

266

% (e[1], url))

244

# jam 20060713 The code didn't use to re-raise the exception here

267

elif e[0] == _pycurl_errors.CURLE_PARTIAL_FILE:

268

# Pycurl itself has detected a short read. We do

269

# not have all the information for the

270

# ShortReadvError, but that should be enough

271

raise errors.ShortReadvError(url,

272

offset='unknown', length='unknown',

273

actual='unknown',

274

extra='Server aborted the request')

275

# jam 20060713 The code didn't use to re-raise the exception here,

245

276

# but that seemed bogus

246

277

raise

247

278

248

279

249

class HttpServer_PyCurl(HttpServer):

250

"""Subclass of HttpServer that gives http+pycurl urls.

251

252

This is for use in testing: connections to this server will always go

253

through pycurl where possible.

254

"""

255

256

# urls returned by this server should require the pycurl client impl

257

_url_protocol = 'http+pycurl'

258

259

260

280

def get_test_permutations():

261

281

"""Return the permutations to be used in testing."""

282

from bzrlib.tests.HttpServer import HttpServer_PyCurl

262

283

return [(PyCurlTransport, HttpServer_PyCurl),

263

284

]

Older »