/brz/remove-bazaar : revision 1786.1.42

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/transport/http/__init__.py

Committer: John Arbash Meinel
Date: 2006-07-19 14:17:49 UTC
mto: This revision was merged to the branch mainline in revision 1869.
Revision ID: john@arbash-meinel.com-20060719141749-5c8a2a433f966f29

Update _extract_headers, make it less generic, and non recursive.

files modified:
bzrlib/tests/test_http_response.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http/__init__.py

import BaseHTTPServer, SimpleHTTPServer, socket, time

import threading

from bzrlib import errors

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError, InvalidURL)

from bzrlib.branch import Branch

return url

def _extract_headers(header_file, skip_first=True, body_is_header=True):

"""Extract the mapping for an rfc822 header

def _extract_headers(header_text, url):

"""Extract the mapping for an rfc2822 header

This is a helper function for the test suite, and for _pycurl.

This is a helper function for the test suite and for _pycurl.

(urllib already parses the headers for us)

:param header_file: A file-like object to read

:param skip_first: HTTP headers start with the HTTP response as

the first line. Skip this line while parsing

:param body_is_header: When pycurl gets a redirect request, it saves

both the redirect headers and the final headers in the header

file. Which means we really want the latter headers, not the

former.

:return: mimetools.Message object

In the case that there are multiple headers inside the file,

the last one is returned.

:param header_text: A string of header information.

This expects that the first line of a header will always be HTTP ...

:param url: The url we are parsing, so we can raise nice errors

:return: mimetools.Message object, which basically acts like a case

insensitive dictionary.

"""

header_file.seek(0, 0)

if skip_first:

header_file.readline()

m = mimetools.Message(header_file)

if body_is_header:

m.rewindbody()

remaining = header_file.read()

# Ignore some extra whitespace, but if we have actual content

100

# lines, then the later content supersedes the earlier.

101

if remaining.strip() != '':

102

return _extract_headers(StringIO(remaining), skip_first=skip_first,

103

body_is_header=True)

first_header = True

remaining = header_text

if not remaining:

raise errors.InvalidHttpResponse(url, 'Empty headers')

while remaining:

100

header_file = StringIO(remaining)

101

first_line = header_file.readline()

102

if not first_line.startswith('HTTP'):

103

if first_header: # The first header *must* start with HTTP

104

raise errors.InvalidHttpResponse(url,

105

'Opening header line did not start with HTTP: %s'

106

% (first_line,))

107

assert False, 'Opening header line was not HTTP'

108

else:

109

break # We are done parsing

110

first_header = False

111

m = mimetools.Message(header_file)

112

113

# mimetools.Message parses the first header up to a blank line

114

# So while there is remaining data, it probably means there is

115

# another header to be parsed.

116

# Get rid of any preceding whitespace, which if it is all whitespace

117

# will get rid of everything.

118

remaining = header_file.read().lstrip()

104

119

return m

105

120

106

121

Older »