/brz/remove-bazaar

To get this branch, use:
bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar
2004.1.40 by v.ladeuil+lp at free
Fix the race condition again and correct some small typos to be in
1
# Copyright (C) 2006 Canonical Ltd
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
2
#
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
#
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
#
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
17
import BaseHTTPServer
18
import errno
19
import os
20
from SimpleHTTPServer import SimpleHTTPRequestHandler
21
import socket
2146.1.1 by Alexander Belchenko
fixes for test suite: forgotten imports in HttpServer.py
22
import posixpath
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
23
import random
24
import re
25
import sys
26
import threading
27
import time
2146.1.1 by Alexander Belchenko
fixes for test suite: forgotten imports in HttpServer.py
28
import urllib
29
import urlparse
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
30
31
from bzrlib.transport import Server
32
33
34
class WebserverNotAvailable(Exception):
    """Error signalling that a web server is not available.

    NOTE(review): nothing in this module raises it; presumably it is
    meant for callers that need a web server and cannot get one.
    """
36
37
38
class BadWebserverPath(ValueError):
    """A local path lies outside the directory served by the web server.

    The exception is expected to be built with exactly two arguments:
    the offending path and the directory it should have been in.
    """

    _template = 'path %s is not in %s'

    def __str__(self):
        # self.args is used directly as the formatting tuple.
        return self._template % self.args
41
42
43
class TestingHTTPRequestHandler(SimpleHTTPRequestHandler):
    """Request handler used by the test http server.

    On top of SimpleHTTPRequestHandler it:
    - sends log lines to ``self.server.test_case.log``,
    - retries reading the request line when the socket reports
      EAGAIN/EWOULDBLOCK,
    - serves GET requests carrying a ``Range`` header.
    """

    def log_message(self, format, *args):
        """Log a request through the test case attached to the server."""
        self.server.test_case.log('webserver - %s - - [%s] %s "%s" "%s"',
                                  self.address_string(),
                                  self.log_date_time_string(),
                                  format % args,
                                  self.headers.get('referer', '-'),
                                  self.headers.get('user-agent', '-'))

    def handle_one_request(self):
        """Read, parse and dispatch a single HTTP request.

        Reading the request line is attempted at most 10 times, sleeping
        10ms after each EAGAIN/EWOULDBLOCK. If every attempt fails the
        connection is closed; any other socket error is re-raised.
        The request is dispatched to the ``do_<COMMAND>`` method, or
        answered with a 501 error if there is no such method.
        """
        for _attempt in range(1, 11): # Don't try more than 10 times
            try:
                self.raw_requestline = self.rfile.readline()
            except socket.error:
                # sys.exc_info() is used instead of binding the exception
                # in the except clause so that the syntax is accepted by
                # every python version.
                e = sys.exc_info()[1]
                if e.args[0] in (errno.EAGAIN, errno.EWOULDBLOCK):
                    # Nothing is logged here because some tests look at
                    # the log of the server and expect to see no errors.
                    # -- mbp 20051021.
                    time.sleep(0.01)
                    continue
                raise
            else:
                break
        else:
            # No attempt succeeded: raw_requestline is either unset or
            # still holds the previous request, so it must not be parsed.
            self.close_connection = 1
            return
        if not self.raw_requestline:
            self.close_connection = 1
            return
        if not self.parse_request(): # An error code has been sent, just exit
            return
        mname = 'do_' + self.command
        method = getattr(self, mname, None)
        if method is None:
            self.send_error(501, "Unsupported method (%r)" % self.command)
            return
        method()

    _range_regexp = re.compile(r'^(?P<start>\d+)-(?P<end>\d+)$')
    _tail_regexp = re.compile(r'^-(?P<tail>\d+)$')

    def parse_ranges(self, ranges_header):
        """Parse the range header value and returns ranges and tail.

        RFC2616 14.35 says that syntactically invalid range
        specifiers MUST be ignored. In that case, we return 0 for
        tail and [] for ranges.

        :param ranges_header: value of the Range header, e.g.
            'bytes=0-9,20-29' or 'bytes=-100'.
        :return: a (tail, ranges) tuple; tail is the length of the
            requested suffix (0 if none), ranges is a list of
            (start, end) tuples with inclusive bounds.
        """
        prefix = 'bytes='
        if not ranges_header.startswith(prefix):
            # Syntactically invalid header
            return 0, []

        tail = 0
        ranges = []
        for range_str in ranges_header[len(prefix):].split(','):
            # RFC2616 2.1 allows linear white space around the commas
            # of a list.
            range_str = range_str.strip()
            # FIXME: RFC2616 says end is optional and default to file_size
            range_match = self._range_regexp.match(range_str)
            if range_match is not None:
                start = int(range_match.group('start'))
                end = int(range_match.group('end'))
                if start > end:
                    # Syntactically invalid range
                    return 0, []
                ranges.append((start, end))
                continue
            tail_match = self._tail_regexp.match(range_str)
            if tail_match is None:
                # Syntactically invalid range
                return 0, []
            tail = int(tail_match.group('tail'))
        return tail, ranges

    def send_range_content(self, file, start, length):
        """Write `length` bytes of `file`, starting at `start`, to wfile."""
        file.seek(start)
        self.wfile.write(file.read(length))

    def get_single_range(self, file, file_size, start, end):
        """Send a 206 response containing the single range start-end.

        :param file: file object opened in binary mode.
        :param file_size: total size of the file, for Content-Range.
        :param start: first byte offset to send.
        :param end: last byte offset to send (inclusive).
        """
        self.send_response(206)
        length = end - start + 1
        self.send_header('Accept-Ranges', 'bytes')
        self.send_header("Content-Length", "%d" % length)

        self.send_header("Content-Type", 'application/octet-stream')
        self.send_header("Content-Range", "bytes %d-%d/%d" % (start,
                                                              end,
                                                              file_size))
        self.end_headers()
        self.send_range_content(file, start, length)

    def get_multiple_ranges(self, file, file_size, ranges):
        """Send a 206 multipart/byteranges response.

        Each range is preceded by a boundary line and its own
        Content-type and Content-Range headers; one more boundary line
        is written after the last range.

        :param file: file object opened in binary mode.
        :param file_size: total size of the file, for Content-Range.
        :param ranges: list of (start, end) tuples, inclusive bounds.
        """
        self.send_response(206)
        self.send_header('Accept-Ranges', 'bytes')
        boundary = "%d" % random.randint(0,0x7FFFFFFF)
        self.send_header("Content-Type",
                         "multipart/byteranges; boundary=%s" % boundary)
        self.end_headers()
        boundary_line = "--%s\r\n" % boundary
        for (start, end) in ranges:
            self.wfile.write(boundary_line)
            self.send_header("Content-type", 'application/octet-stream')
            self.send_header("Content-Range", "bytes %d-%d/%d" % (start,
                                                                  end,
                                                                  file_size))
            self.end_headers()
            self.send_range_content(file, start, end - start + 1)
        # Final boundary, written once. It used to be written after each
        # part, which put two consecutive boundaries between parts.
        # NOTE(review): RFC2046 spells the closing delimiter
        # '--boundary--'; the plain form is kept so that the clients
        # already tested against this server are not affected.
        self.wfile.write(boundary_line)

    def _normalize_ranges(self, tail, ranges, file_size):
        """Turn parsed ranges into the ranges that will really be sent.

        :param tail: suffix length as returned by parse_ranges (0 if none).
        :param ranges: list of (start, end) as returned by parse_ranges.
        :param file_size: size of the file being served.
        :return: a new list of (start, end) tuples, or None when the
            request is not satisfiable (no range at all, or a range
            starting at or after file_size).
        """
        wanted = list(ranges)
        if tail != 0:
            # RFC2616 14.35: a suffix longer than the file selects the
            # whole file, so the start offset must never go negative.
            wanted.append((max(0, file_size - tail), file_size - 1))
        if not wanted:
            return None
        satisfiable = []
        for start, end in wanted:
            # RFC2616 14.35, ranges are invalid if start >= file_size
            if start >= file_size:
                return None
            # RFC2616 14.35, end values should be truncated
            # to file_size -1 if they exceed it
            satisfiable.append((start, min(end, file_size - 1)))
        return satisfiable

    def do_GET(self):
        """Serve a GET request.

        Handles the Range header. Requests without a Range header, or
        for a directory, are left to SimpleHTTPRequestHandler. A missing
        file yields a 404 and unsatisfiable ranges yield a 416.
        """
        path = self.translate_path(self.path)
        ranges_header_value = self.headers.get('Range')
        if ranges_header_value is None or os.path.isdir(path):
            # Let the mother class handle most cases
            return SimpleHTTPRequestHandler.do_GET(self)

        try:
            # Always read in binary mode. Opening files in text
            # mode may cause newline translations, making the
            # actual size of the content transmitted *less* than
            # the content-length!
            file = open(path, 'rb')
        except IOError:
            self.send_error(404, "File not found")
            return

        # The file is closed whatever happens while answering.
        try:
            file_size = os.fstat(file.fileno())[6]
            tail, ranges = self.parse_ranges(ranges_header_value)
            ranges = self._normalize_ranges(tail, ranges, file_size)

            # Kept as an attribute because it was one before.
            self._satisfiable_ranges = ranges is not None
            if not self._satisfiable_ranges:
                # RFC2616 14.16 and 14.35 says that when a server
                # encounters unsatisfiable range specifiers, it
                # SHOULD return a 416.
                # FIXME: We SHOULD send a Content-Range header too,
                # but the implementation of send_error does not
                # allows that. So far.
                self.send_error(416, "Requested range not satisfiable")
                return

            if len(ranges) == 1:
                (start, end) = ranges[0]
                self.get_single_range(file, file_size, start, end)
            else:
                self.get_multiple_ranges(file, file_size, ranges)
        finally:
            file.close()

    if sys.platform == 'win32':
        # On win32 you cannot access non-ascii filenames without
        # decoding them into unicode first.
        # However, under Linux, you can access bytestream paths
        # without any problems. If this function was always active
        # it would probably break tests when LANG=C was set
        def translate_path(self, path):
            """Translate a /-separated PATH to the local filename syntax.

            For bzr, all url paths are considered to be utf8 paths.
            On Linux, you can access these paths directly over the bytestream
            request, but on win32, you must decode them, and access them
            as Unicode files.
            """
            # abandon query parameters
            path = urlparse.urlparse(path)[2]
            path = posixpath.normpath(urllib.unquote(path))
            path = path.decode('utf-8')
            words = path.split('/')
            words = filter(None, words)
            path = os.getcwdu()
            for word in words:
                # Only the last component of each word is kept: drive
                # letters and directory parts are dropped.
                drive, word = os.path.splitdrive(word)
                head, word = os.path.split(word)
                if word in (os.curdir, os.pardir):
                    continue
                path = os.path.join(path, word)
            return path
247
248
249
class TestingHTTPServer(BaseHTTPServer.HTTPServer):
    """HTTPServer that keeps a reference to the test case it serves.

    The request handler reaches that object through
    ``self.server.test_case`` to log the requests.
    """

    def __init__(self, server_address, RequestHandlerClass, test_case):
        """Create the server, then remember `test_case`.

        :param server_address: (host, port) tuple handed to HTTPServer.
        :param RequestHandlerClass: handler class handed to HTTPServer.
        :param test_case: object stored as ``self.test_case``.
        """
        base_class = BaseHTTPServer.HTTPServer
        base_class.__init__(self, server_address, RequestHandlerClass)
        self.test_case = test_case
254
255
256
class HttpServer(Server):
    """A test server for http transports.

    The server runs in a daemon thread started by setUp() and stopped by
    tearDown(). It serves the directory that was current when setUp()
    was called. Subclasses can provide a specific request handler.
    """

    # used to form the url that connects to this server
    _url_protocol = 'http'

    # Subclasses can provide a specific request handler
    def __init__(self, request_handler=TestingHTTPRequestHandler):
        """Create a server that is not listening yet.

        :param request_handler: request handler class handed to the
            underlying TestingHTTPServer.
        """
        Server.__init__(self)
        self.request_handler = request_handler
        self.host = 'localhost'
        # 0 until the socket is bound, then the real port number.
        self.port = 0
        self._httpd = None

    def _get_httpd(self):
        """Return the TestingHTTPServer, creating it on first use.

        Creating the server also records the port it is bound to in
        self.port.
        """
        if self._httpd is None:
            self._httpd = TestingHTTPServer((self.host, self.port),
                                            self.request_handler,
                                            self)
            self.port = self._httpd.socket.getsockname()[1]
        return self._httpd

    def _http_start(self):
        """Entry point of the server thread.

        Creates the server, publishes its base url, releases the
        start-up lock that setUp() is waiting on, then handles requests
        until self._http_running becomes false.
        """
        try:
            httpd = self._get_httpd()
            self._http_base_url = '%s://%s:%s/' % (self._url_protocol,
                                                   self.host,
                                                   self.port)
        finally:
            # Always release the lock, or setUp() would block forever
            # when the server cannot be created. In that case
            # _http_base_url is still None and the exception ends the
            # thread.
            self._http_starting.release()
        # The timeout lets the loop below notice that _http_running
        # was cleared.
        httpd.socket.settimeout(0.1)

        while self._http_running:
            try:
                httpd.handle_request()
            except socket.timeout:
                pass

    def _get_remote_url(self, path):
        """Return the url through which the local `path` is served.

        :param path: a relative path, or an absolute path located under
            the directory recorded by setUp().
        :raises BadWebserverPath: if `path` is absolute and not under
            that directory.
        """
        path_parts = path.split(os.path.sep)
        if os.path.isabs(path):
            served_parts = self._local_path_parts
            if path_parts[:len(served_parts)] != served_parts:
                # The served directory is self._home_dir; no test_dir
                # attribute is ever set on this object.
                raise BadWebserverPath(path, self._home_dir)
            remote_path = '/'.join(path_parts[len(served_parts):])
        else:
            remote_path = '/'.join(path_parts)

        return self._http_base_url + remote_path

    def log(self, format, *args):
        """Capture Server log output."""
        self.logs.append(format % args)

    def setUp(self):
        """See bzrlib.transport.Server.setUp.

        :raises WebserverNotAvailable: if the server thread could not
            create the http server.
        """
        self._home_dir = os.getcwdu()
        self._local_path_parts = self._home_dir.split(os.path.sep)
        # Created before the thread is started so that log() can be
        # called as soon as the server runs.
        self.logs = []
        self._http_starting = threading.Lock()
        self._http_starting.acquire()
        self._http_running = True
        self._http_base_url = None
        self._http_thread = threading.Thread(target=self._http_start)
        self._http_thread.setDaemon(True)
        self._http_thread.start()
        # Wait for the server thread to start (i.e release the lock)
        self._http_starting.acquire()
        self._http_starting.release()
        if self._http_base_url is None:
            # The thread released the lock without publishing an url:
            # the server could not be created.
            self._http_running = False
            self._http_thread.join()
            raise WebserverNotAvailable(
                'the test http server could not be started')

    def tearDown(self):
        """See bzrlib.transport.Server.tearDown."""
        self._http_running = False
        self._http_thread.join()
        if self._httpd is not None:
            # Close the listening socket instead of leaking it. A later
            # setUp() creates a new server on the port kept in self.port.
            self._httpd.server_close()
            self._httpd = None

    def get_url(self):
        """See bzrlib.transport.Server.get_url."""
        return self._get_remote_url(self._home_dir)

    def get_bogus_url(self):
        """See bzrlib.transport.Server.get_bogus_url."""
        # this is chosen to try to prevent trouble with proxies, weird dns,
        # etc
        return 'http://127.0.0.1:1/'
341
342
343
class HttpServer_urllib(HttpServer):
    """HttpServer variant whose urls use the http+urllib scheme.

    Intended for tests: wherever possible, connections to this server
    are made through urllib.
    """

    # the scheme makes the returned urls require the urllib client impl
    _url_protocol = 'http+urllib'
352
353
354
class HttpServer_PyCurl(HttpServer):
    """HttpServer variant whose urls use the http+pycurl scheme.

    Intended for tests: wherever possible, connections to this server
    are made through pycurl.
    """

    # pycurl availability is not checked here: this server is only
    # required when pycurl is present.

    # the scheme makes the returned urls require the pycurl client impl
    _url_protocol = 'http+pycurl'