/brz/remove-bazaar : revision 1530.1.7

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: Robert Collins
Date: 2006-01-03 02:07:06 UTC
mfrom: (1533 integration)
mto: (1508.1.17 checkout) (1534.1.6 integration)
mto: This revision was merged to the branch mainline in revision 1543.
Revision ID: robertc@robertcollins.net-20060103020706-998bb02793088bdf

merge integration.

files added:
.bzrignore

.rsyncexclude

HACKING

INSTALL

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr_man.py

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/clone.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_parent.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_remove.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revision_info.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

setup.py

tools

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files removed:
.bzrignore

COPYING

HACKING

INSTALL

Makefile

NEWS

README

TODO

__init__.py

branch.py

bzr-receive-pack

bzr-upload-pack

cache.py

commands.py

commit.py

config.py

dir.py

errors.py

fetch.py

help.py

hg.py

info.py

inventory.py

mapping.py

notes

notes/git-serve.txt

notes/mapping.txt

notes/roundtripping.txt

object_store.py

push.py

refs.py

remote.py

repository.py

revspec.py

roundtrip.py

send.py

server.py

setup.py

tests

tests/__init__.py

tests/test_blackbox.py

tests/test_branch.py

tests/test_builder.py

tests/test_cache.py

tests/test_dir.py

tests/test_fetch.py

tests/test_mapping.py

tests/test_object_store.py

tests/test_push.py

tests/test_refs.py

tests/test_remote.py

tests/test_repository.py

tests/test_revspec.py

tests/test_roundtrip.py

tests/test_transportgit.py

transportgit.py

tree.py

versionedfiles.py

workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Implementation of Transport over http.

"""

import os, errno

from cStringIO import StringIO

import urllib, urllib2

import urlparse

from bzrlib.transport import Transport, Server

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError)

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.trace import mutter

def extract_auth(url, password_manager):
    """Strip the auth parameters out of an HTTP/HTTPS url.

    A ``user[:password]@`` prefix on the host part is removed from the url.
    When a password is present, the url-unquoted user name and password are
    registered with the password manager for that host (without the port).
    The cleaned url is returned because auth parameters left in the url
    confuse urllib2.

    :param url: A url starting with 'http://' or 'https://'.
    :param password_manager: Object whose
        add_password(realm, host, username, password) receives the
        credentials; the realm passed is always None.
    :return: The url minus the auth parameters.
    """
    assert url.startswith('http://') or url.startswith('https://')
    scheme, remainder = url.split('//', 1)

    # Separate "host stuff" from the path (the path keeps its leading '/').
    pieces = remainder.split('/', 1)
    host = pieces[0]
    if len(pieces) == 2:
        path = '/' + pieces[1]
    else:
        path = ''

    port = ''
    if '@' in host:
        auth, host = host.split('@', 1)
        credentials = auth.split(':', 1)
        username = credentials[0]
        if len(credentials) == 2:
            password = credentials[1]
        else:
            password = None
        # The port is only peeled off when credentials were present; without
        # them it simply stays attached to host and round-trips unchanged.
        if ':' in host:
            host, port_number = host.split(':', 1)
            port = ':' + port_number
        # FIXME: if password isn't given, should we ask for it?
        if password is not None:
            password_manager.add_password(None, host,
                                          urllib.unquote(username),
                                          urllib.unquote(password))
    return ''.join([scheme, '//', host, port, path])

def get_url(url):
    """Open url through urllib2 and return the resulting file-like object.

    Credentials embedded in the url are moved into a urllib2 password
    manager by extract_auth() and offered via HTTP basic authentication.

    :param url: The http:// or https:// url to open.
    :return: Whatever the urllib2 opener's open() returns.
    """
    import urllib2
    mutter("get_url %s" % url)
    password_mgr = urllib2.HTTPPasswordMgrWithDefaultRealm()
    clean_url = extract_auth(url, password_mgr)
    opener = urllib2.build_opener(urllib2.HTTPBasicAuthHandler(password_mgr))
    return opener.open(clean_url)

class HttpTransport(Transport):
    """This is the transport agent for http:// access.

    The transport is read-only: has() and get() fetch data with get_url(),
    while every mutating operation raises TransportNotPossible.

    TODO: Implement pipelined versions of all of the *_multi() functions.
    """

    def __init__(self, base):
        """Set the base path where files will be stored.

        :param base: An http:// or https:// url.  A trailing '/' is added
            when it is missing.
        """
        assert base.startswith('http://') or base.startswith('https://')
        if base[-1] != '/':
            base = base + '/'
        super(HttpTransport, self).__init__(base)
        # In the future we might actually connect to the remote host
        # rather than using get_url
        # self._connection = None
        # NOTE(review): self.base is presumably set by Transport.__init__
        # from the value passed above - confirm against the base class.
        (self._proto, self._host,
         self._path, self._parameters,
         self._query, self._fragment) = urlparse.urlparse(self.base)

    def should_cache(self):
        """Return True if the data pulled across should be cached locally."""
        return True

    def clone(self, offset=None):
        """Return a new HttpTransport with root at self.base + offset

        For now HttpTransport does not actually connect, so just return
        a new HttpTransport object.

        :param offset: Relative path below this transport, or None to clone
            the transport at the same base.
        """
        if offset is None:
            return HttpTransport(self.base)
        else:
            return HttpTransport(self.abspath(offset))

    def abspath(self, relpath):
        """Return the full url to the given relative path.

        '.' and empty components are ignored and '..' removes the last
        component collected so far (staying put when nothing is left).
        Parameters, query and fragment of the base url are dropped.

        :param relpath: Path relative to the base, as a string.
        :raises ValueError: If a multi-component relpath starts or ends
            with '/' (looks absolute, or looks like a directory).
        """
        assert isinstance(relpath, basestring)
        if isinstance(relpath, basestring):
            relpath_parts = relpath.split('/')
        else:
            # Only reachable when assertions are disabled.
            # TODO: Don't call this with an array - no magic interfaces
            relpath_parts = relpath[:]
        if len(relpath_parts) > 1:
            if relpath_parts[0] == '':
                raise ValueError("path %r within branch %r seems to be absolute"
                                 % (relpath, self._path))
            if relpath_parts[-1] == '':
                raise ValueError("path %r within branch %r seems to be a directory"
                                 % (relpath, self._path))
        basepath = self._path.split('/')
        if len(basepath) > 0 and basepath[-1] == '':
            # Drop the empty component produced by the trailing '/'.
            basepath = basepath[:-1]
        for p in relpath_parts:
            if p == '..':
                if len(basepath) == 0:
                    # In most filesystems, a request for the parent
                    # of root, just returns root.
                    continue
                basepath.pop()
            elif p == '.' or p == '':
                continue # No-op
            else:
                basepath.append(p)
        # Possibly, we could use urlparse.urljoin() here, but
        # I'm concerned about when it chooses to strip the last
        # portion of the path, and when it doesn't.
        path = '/'.join(basepath)
        return urlparse.urlunparse((self._proto,
                                    self._host, path, '', '', ''))

    def has(self, relpath):
        """Does the target location exist?

        TODO: HttpTransport.has() should use a HEAD request,
        not a full GET request.

        TODO: This should be changed so that we don't use
        urllib2 and get an exception, the code path would be
        cleaner if we just do an http HEAD request, and parse
        the return code.

        :param relpath: Path relative to the base.
        :return: True when the url could be fetched, False on an HTTP 404
            or an ENOENT IOError.
        :raises TransportError: For any other IOError, including urllib2
            failures that carry no HTTP status code.
        """
        path = relpath
        try:
            path = self.abspath(relpath)
            f = get_url(path)
            try:
                # Without the read and then close()
                # we tend to have busy sockets.
                f.read()
            finally:
                f.close()
            return True
        except urllib2.HTTPError as e:
            # Only HTTPError carries a status code; a plain URLError (for
            # example a refused connection) is handled as an IOError below.
            mutter('url error code: %s for has url: %r', e.code, path)
            if e.code == 404:
                return False
            raise
        except IOError as e:
            mutter('io error: %s %s for has url: %r',
                   e.errno, errno.errorcode.get(e.errno), path)
            if e.errno == errno.ENOENT:
                return False
            raise TransportError(orig_error=e)

    def get(self, relpath, decode=False):
        """Get the file at the given relative path.

        :param relpath: The relative path to the file
        :param decode: Accepted but not used by this implementation.
        :return: The file-like object returned by get_url().
        :raises NoSuchFile: On an HTTP 404 or an ENOENT error.
        :raises ConnectionError: On any other BzrError or IOError.
        """
        path = relpath
        try:
            path = self.abspath(relpath)
            return get_url(path)
        except urllib2.HTTPError as e:
            mutter('url error code: %s for get url: %r', e.code, path)
            if e.code == 404:
                raise NoSuchFile(path, extra=e)
            raise
        except (BzrError, IOError) as e:
            if hasattr(e, 'errno'):
                mutter('io error: %s %s for get url: %r',
                       e.errno, errno.errorcode.get(e.errno), path)
                if e.errno == errno.ENOENT:
                    raise NoSuchFile(path, extra=e)
            raise ConnectionError(msg = "Error retrieving %s: %s"
                                  % (self.abspath(relpath), str(e)),
                                  orig_error=e)

    def put(self, relpath, f, mode=None):
        """Copy the file-like or string object into the location.

        :param relpath: Location to put the contents, relative to base.
        :param f: File-like or string object.
        :raises TransportNotPossible: Always.
        """
        raise TransportNotPossible('http PUT not supported')

    def mkdir(self, relpath, mode=None):
        """Create a directory at the given path.

        :raises TransportNotPossible: Always.
        """
        raise TransportNotPossible('http does not support mkdir()')

    def append(self, relpath, f):
        """Append the text in the file-like object into the final
        location.

        :raises TransportNotPossible: Always.
        """
        raise TransportNotPossible('http does not support append()')

    def copy(self, rel_from, rel_to):
        """Copy the item at rel_from to the location at rel_to

        :raises TransportNotPossible: Always.
        """
        raise TransportNotPossible('http does not support copy()')

    def copy_to(self, relpaths, other, mode=None, pb=None):
        """Copy a set of entries from self into another Transport.

        :param relpaths: A list/generator of entries to be copied.
        :param other: The target transport.
        :raises TransportNotPossible: If other is an HttpTransport.

        TODO: if other is LocalTransport, is it possible to
              do better than put(get())?
        """
        # At this point HttpTransport might be able to check and see if
        # the remote location is the same, and rather than download, and
        # then upload, it could just issue a remote copy_this command.
        if isinstance(other, HttpTransport):
            raise TransportNotPossible('http cannot be the target of copy_to()')
        else:
            return super(HttpTransport, self).copy_to(relpaths, other, mode=mode, pb=pb)

    def move(self, rel_from, rel_to):
        """Move the item at rel_from to the location at rel_to

        :raises TransportNotPossible: Always.
        """
        raise TransportNotPossible('http does not support move()')

    def delete(self, relpath):
        """Delete the item at relpath

        :raises TransportNotPossible: Always.
        """
        raise TransportNotPossible('http does not support delete()')

    def is_readonly(self):
        """See Transport.is_readonly."""
        return True

    def listable(self):
        """See Transport.listable."""
        return False

    def stat(self, relpath):
        """Return the stat information for a file.

        :raises TransportNotPossible: Always.
        """
        raise TransportNotPossible('http does not support stat()')

    def lock_read(self, relpath):
        """Lock the given file for shared (read) access.

        :return: A lock object, which should be passed to Transport.unlock()
        """
        # The old RemoteBranch ignore lock for reading, so we will
        # continue that tradition and return a bogus lock object.
        class BogusLock(object):
            def __init__(self, path):
                self.path = path
            def unlock(self):
                pass
        return BogusLock(relpath)

    def lock_write(self, relpath):
        """Lock the given file for exclusive (write) access.

        WARNING: many transports do not support this, so trying avoid using it

        :return: A lock object, which should be passed to Transport.unlock()
        :raises TransportNotPossible: Always.
        """
        raise TransportNotPossible('http does not support lock_write()')

280

281

282

#---------------- test server facilities ----------------

283

import BaseHTTPServer, SimpleHTTPServer, socket, time

284

import threading

285

286

287

class WebserverNotAvailable(Exception):
    """Raised when the test web server cannot be run."""

289

290

291

class BadWebserverPath(ValueError):
    """A path was requested that is not below the served directory.

    Construct it with two arguments: the offending path and the directory
    it was expected to be in.
    """

    def __str__(self):
        template = 'path %s is not in %s'
        return template % self.args

294

295

296

class TestingHTTPRequestHandler(SimpleHTTPServer.SimpleHTTPRequestHandler):
    """Request handler used by the test web server.

    Log output goes to the owning server's test case instead of stderr, and
    reading the request line tolerates a socket that temporarily has no
    data available.
    """

    def log_message(self, format, *args):
        """Forward a log line to self.server.test_case.log()."""
        self.server.test_case.log("webserver - %s - - [%s] %s",
                                  self.address_string(),
                                  self.log_date_time_string(),
                                  format%args)

    def handle_one_request(self):
        """Handle a single HTTP request.

        You normally don't need to override this method; see the class
        __doc__ string for information on how to handle specific HTTP
        commands such as GET and POST.

        The request line is read with up to 10 attempts, sleeping 10ms
        after each EAGAIN/EWOULDBLOCK.  If every attempt fails that way, no
        request was received: the connection is marked for closing and
        nothing is dispatched, rather than acting on a request line left
        over from an earlier call.
        """
        for _attempt in range(1, 11): # Don't try more than 10 times
            try:
                self.raw_requestline = self.rfile.readline()
            except socket.error as e:
                if e.args[0] in (errno.EAGAIN, errno.EWOULDBLOCK):
                    # omitted for now because some tests look at the log of
                    # the server and expect to see no errors.  see recent
                    # email thread. -- mbp 20051021.
                    ## self.log_message('EAGAIN (%d) while reading from raw_requestline' % i)
                    time.sleep(0.01)
                    continue
                raise
            else:
                break
        else:
            # Every attempt hit EAGAIN, so there is nothing to process.
            self.close_connection = 1
            return
        if not self.raw_requestline:
            self.close_connection = 1
            return
        if not self.parse_request(): # An error code has been sent, just exit
            return
        mname = 'do_' + self.command
        if not hasattr(self, mname):
            self.send_error(501, "Unsupported method (%r)" % self.command)
            return
        method = getattr(self, mname)
        method()

337

338

class TestingHTTPServer(BaseHTTPServer.HTTPServer):
    """An HTTPServer that remembers which test case it is serving.

    The object is stored as the test_case attribute, which
    TestingHTTPRequestHandler.log_message() reaches through self.server.
    """

    def __init__(self, server_address, RequestHandlerClass, test_case):
        """Create the server, then record test_case on it."""
        base_init = BaseHTTPServer.HTTPServer.__init__
        base_init(self, server_address, RequestHandlerClass)
        self.test_case = test_case

343

344

345

class HttpServer(Server):
    """A test server for http transports.

    setUp() starts a daemon thread that serves requests on the first free
    localhost port from _HTTP_PORTS; tearDown() stops it again.
    """

    # Ports tried, in order, when looking for one to listen on.
    _HTTP_PORTS = range(13000, 0x8000)

    def _bind_httpd(self):
        """Create a TestingHTTPServer on the first free port.

        :return: A (httpd, port) tuple.
        :raises WebserverNotAvailable: If every port is already in use.
        :raises socket.error: For any bind failure other than EADDRINUSE.
        """
        import sys
        for port in self._HTTP_PORTS:
            try:
                httpd = TestingHTTPServer(('localhost', port),
                                          TestingHTTPRequestHandler,
                                          self)
            except socket.error as e:
                if e.args[0] == errno.EADDRINUSE:
                    continue
                sys.stderr.write("Cannot run webserver :-(\n")
                raise
            else:
                return httpd, port
        raise WebserverNotAvailable("Cannot run webserver :-( "
                                    "no free ports in range %s..%s" %
                                    (self._HTTP_PORTS[0],
                                     self._HTTP_PORTS[-1]))

    def _http_start(self):
        """Thread body: bind the server and serve until told to stop."""
        try:
            httpd, port = self._bind_httpd()
            self._http_base_url = 'http://localhost:%s/' % port
        finally:
            # Release the startup lock even when binding failed, so that
            # _get_remote_url() reports the failure instead of blocking.
            self._http_starting.release()
        try:
            # Use a short timeout so the loop notices _http_running changing.
            httpd.socket.settimeout(0.1)
            while self._http_running:
                try:
                    httpd.handle_request()
                except socket.timeout:
                    pass
        finally:
            # Give the listening socket back once serving stops.
            httpd.server_close()

    def _get_remote_url(self, path):
        """Return the url under which the local path is being served.

        :param path: A path relative to the served directory, or an
            absolute path inside it.
        :raises BadWebserverPath: If an absolute path is outside the served
            directory.
        :raises WebserverNotAvailable: If the server thread could not start
            a web server.
        """
        path_parts = path.split(os.path.sep)
        if os.path.isabs(path):
            if path_parts[:len(self._local_path_parts)] != \
                   self._local_path_parts:
                raise BadWebserverPath(path, self._home_dir)
            remote_path = '/'.join(path_parts[len(self._local_path_parts):])
        else:
            remote_path = '/'.join(path_parts)

        # Wait until the server thread has finished starting up.
        self._http_starting.acquire()
        self._http_starting.release()
        if self._http_base_url is None:
            raise WebserverNotAvailable("Cannot run webserver :-( "
                                        "the server thread failed to start")
        return self._http_base_url + remote_path

    def log(self, *args, **kwargs):
        """Capture Server log output."""

    def setUp(self):
        """See bzrlib.transport.Server.setUp."""
        self._home_dir = os.getcwdu()
        self._local_path_parts = self._home_dir.split(os.path.sep)
        # Held until the server thread knows its url (or has failed).
        self._http_starting = threading.Lock()
        self._http_starting.acquire()
        self._http_running = True
        self._http_base_url = None
        self._http_thread = threading.Thread(target=self._http_start)
        self._http_thread.setDaemon(True)
        self._http_thread.start()
        # Remove http_proxy from the environment for the server's lifetime;
        # tearDown() puts it back.
        self._http_proxy = os.environ.get("http_proxy")
        if self._http_proxy is not None:
            del os.environ["http_proxy"]

    def tearDown(self):
        """See bzrlib.transport.Server.tearDown."""
        self._http_running = False
        self._http_thread.join()
        if self._http_proxy is not None:
            os.environ["http_proxy"] = self._http_proxy

    def get_url(self):
        """See bzrlib.transport.Server.get_url."""
        return self._get_remote_url(self._home_dir)

Older »