1import unittest
2from test import test_support
3
4import os
5import socket
6import StringIO
7
8import urllib2
9from urllib2 import Request, OpenerDirector
10
11# XXX
12# Request
13# CacheFTPHandler (hard to write)
14# parse_keqv_list, parse_http_list, HTTPDigestAuthHandler
15
16class TrivialTests(unittest.TestCase):
17    def test_trivial(self):
18        # A couple trivial tests
19
20        self.assertRaises(ValueError, urllib2.urlopen, 'bogus url')
21
22        # XXX Name hacking to get this to work on Windows.
23        fname = os.path.abspath(urllib2.__file__).replace('\\', '/')
24
25        # And more hacking to get it to work on MacOS. This assumes
26        # urllib.pathname2url works, unfortunately...
27        if os.name == 'riscos':
28            import string
29            fname = os.expand(fname)
30            fname = fname.translate(string.maketrans("/.", "./"))
31
32        if os.name == 'nt':
33            file_url = "file:///%s" % fname
34        else:
35            file_url = "file://%s" % fname
36
37        f = urllib2.urlopen(file_url)
38
39        buf = f.read()
40        f.close()
41
42    def test_parse_http_list(self):
43        tests = [('a,b,c', ['a', 'b', 'c']),
44                 ('path"o,l"og"i"cal, example', ['path"o,l"og"i"cal', 'example']),
45                 ('a, b, "c", "d", "e,f", g, h', ['a', 'b', '"c"', '"d"', '"e,f"', 'g', 'h']),
46                 ('a="b\\"c", d="e\\,f", g="h\\\\i"', ['a="b"c"', 'd="e,f"', 'g="h\\i"'])]
47        for string, list in tests:
48            self.assertEqual(urllib2.parse_http_list(string), list)
49
50
51def test_request_headers_dict():
52    """
53    The Request.headers dictionary is not a documented interface.  It should
54    stay that way, because the complete set of headers are only accessible
55    through the .get_header(), .has_header(), .header_items() interface.
56    However, .headers pre-dates those methods, and so real code will be using
57    the dictionary.
58
59    The introduction in 2.4 of those methods was a mistake for the same reason:
60    code that previously saw all (urllib2 user)-provided headers in .headers
61    now sees only a subset (and the function interface is ugly and incomplete).
62    A better change would have been to replace .headers dict with a dict
63    subclass (or UserDict.DictMixin instance?)  that preserved the .headers
64    interface and also provided access to the "unredirected" headers.  It's
65    probably too late to fix that, though.
66
67
68    Check .capitalize() case normalization:
69
70    >>> url = "http://example.com"
71    >>> Request(url, headers={"Spam-eggs": "blah"}).headers["Spam-eggs"]
72    'blah'
73    >>> Request(url, headers={"spam-EggS": "blah"}).headers["Spam-eggs"]
74    'blah'
75
76    Currently, Request(url, "Spam-eggs").headers["Spam-Eggs"] raises KeyError,
77    but that could be changed in future.
78
79    """
80
81def test_request_headers_methods():
82    """
83    Note the case normalization of header names here, to .capitalize()-case.
84    This should be preserved for backwards-compatibility.  (In the HTTP case,
85    normalization to .title()-case is done by urllib2 before sending headers to
86    httplib).
87
88    >>> url = "http://example.com"
89    >>> r = Request(url, headers={"Spam-eggs": "blah"})
90    >>> r.has_header("Spam-eggs")
91    True
92    >>> r.header_items()
93    [('Spam-eggs', 'blah')]
94    >>> r.add_header("Foo-Bar", "baz")
95    >>> items = r.header_items()
96    >>> items.sort()
97    >>> items
98    [('Foo-bar', 'baz'), ('Spam-eggs', 'blah')]
99
100    Note that e.g. r.has_header("spam-EggS") is currently False, and
101    r.get_header("spam-EggS") returns None, but that could be changed in
102    future.
103
104    >>> r.has_header("Not-there")
105    False
106    >>> print r.get_header("Not-there")
107    None
108    >>> r.get_header("Not-there", "default")
109    'default'
110
111    """
112
113
114def test_password_manager(self):
115    """
116    >>> mgr = urllib2.HTTPPasswordMgr()
117    >>> add = mgr.add_password
118    >>> add("Some Realm", "http://example.com/", "joe", "password")
119    >>> add("Some Realm", "http://example.com/ni", "ni", "ni")
120    >>> add("c", "http://example.com/foo", "foo", "ni")
121    >>> add("c", "http://example.com/bar", "bar", "nini")
122    >>> add("b", "http://example.com/", "first", "blah")
123    >>> add("b", "http://example.com/", "second", "spam")
124    >>> add("a", "http://example.com", "1", "a")
125    >>> add("Some Realm", "http://c.example.com:3128", "3", "c")
126    >>> add("Some Realm", "d.example.com", "4", "d")
127    >>> add("Some Realm", "e.example.com:3128", "5", "e")
128
129    >>> mgr.find_user_password("Some Realm", "example.com")
130    ('joe', 'password')
131    >>> mgr.find_user_password("Some Realm", "http://example.com")
132    ('joe', 'password')
133    >>> mgr.find_user_password("Some Realm", "http://example.com/")
134    ('joe', 'password')
135    >>> mgr.find_user_password("Some Realm", "http://example.com/spam")
136    ('joe', 'password')
137    >>> mgr.find_user_password("Some Realm", "http://example.com/spam/spam")
138    ('joe', 'password')
139    >>> mgr.find_user_password("c", "http://example.com/foo")
140    ('foo', 'ni')
141    >>> mgr.find_user_password("c", "http://example.com/bar")
142    ('bar', 'nini')
143
144    Actually, this is really undefined ATM
145##     Currently, we use the highest-level path where more than one match:
146
147##     >>> mgr.find_user_password("Some Realm", "http://example.com/ni")
148##     ('joe', 'password')
149
150    Use latest add_password() in case of conflict:
151
152    >>> mgr.find_user_password("b", "http://example.com/")
153    ('second', 'spam')
154
155    No special relationship between a.example.com and example.com:
156
157    >>> mgr.find_user_password("a", "http://example.com/")
158    ('1', 'a')
159    >>> mgr.find_user_password("a", "http://a.example.com/")
160    (None, None)
161
162    Ports:
163
164    >>> mgr.find_user_password("Some Realm", "c.example.com")
165    (None, None)
166    >>> mgr.find_user_password("Some Realm", "c.example.com:3128")
167    ('3', 'c')
168    >>> mgr.find_user_password("Some Realm", "http://c.example.com:3128")
169    ('3', 'c')
170    >>> mgr.find_user_password("Some Realm", "d.example.com")
171    ('4', 'd')
172    >>> mgr.find_user_password("Some Realm", "e.example.com:3128")
173    ('5', 'e')
174
175    """
176    pass
177
178
179def test_password_manager_default_port(self):
180    """
181    >>> mgr = urllib2.HTTPPasswordMgr()
182    >>> add = mgr.add_password
183
184    The point to note here is that we can't guess the default port if there's
185    no scheme.  This applies to both add_password and find_user_password.
186
187    >>> add("f", "http://g.example.com:80", "10", "j")
188    >>> add("g", "http://h.example.com", "11", "k")
189    >>> add("h", "i.example.com:80", "12", "l")
190    >>> add("i", "j.example.com", "13", "m")
191    >>> mgr.find_user_password("f", "g.example.com:100")
192    (None, None)
193    >>> mgr.find_user_password("f", "g.example.com:80")
194    ('10', 'j')
195    >>> mgr.find_user_password("f", "g.example.com")
196    (None, None)
197    >>> mgr.find_user_password("f", "http://g.example.com:100")
198    (None, None)
199    >>> mgr.find_user_password("f", "http://g.example.com:80")
200    ('10', 'j')
201    >>> mgr.find_user_password("f", "http://g.example.com")
202    ('10', 'j')
203    >>> mgr.find_user_password("g", "h.example.com")
204    ('11', 'k')
205    >>> mgr.find_user_password("g", "h.example.com:80")
206    ('11', 'k')
207    >>> mgr.find_user_password("g", "http://h.example.com:80")
208    ('11', 'k')
209    >>> mgr.find_user_password("h", "i.example.com")
210    (None, None)
211    >>> mgr.find_user_password("h", "i.example.com:80")
212    ('12', 'l')
213    >>> mgr.find_user_password("h", "http://i.example.com:80")
214    ('12', 'l')
215    >>> mgr.find_user_password("i", "j.example.com")
216    ('13', 'm')
217    >>> mgr.find_user_password("i", "j.example.com:80")
218    (None, None)
219    >>> mgr.find_user_password("i", "http://j.example.com")
220    ('13', 'm')
221    >>> mgr.find_user_password("i", "http://j.example.com:80")
222    (None, None)
223
224    """
225
226class MockOpener:
227    addheaders = []
228    def open(self, req, data=None,timeout=socket._GLOBAL_DEFAULT_TIMEOUT):
229        self.req, self.data, self.timeout  = req, data, timeout
230    def error(self, proto, *args):
231        self.proto, self.args = proto, args
232
233class MockFile:
234    def read(self, count=None): pass
235    def readline(self, count=None): pass
236    def close(self): pass
237
238class MockHeaders(dict):
239    def getheaders(self, name):
240        return self.values()
241
242class MockResponse(StringIO.StringIO):
243    def __init__(self, code, msg, headers, data, url=None):
244        StringIO.StringIO.__init__(self, data)
245        self.code, self.msg, self.headers, self.url = code, msg, headers, url
246    def info(self):
247        return self.headers
248    def geturl(self):
249        return self.url
250
251class MockCookieJar:
252    def add_cookie_header(self, request):
253        self.ach_req = request
254    def extract_cookies(self, response, request):
255        self.ec_req, self.ec_r = request, response
256
257class FakeMethod:
258    def __init__(self, meth_name, action, handle):
259        self.meth_name = meth_name
260        self.handle = handle
261        self.action = action
262    def __call__(self, *args):
263        return self.handle(self.meth_name, self.action, *args)
264
265class MockHTTPResponse:
266    def __init__(self, fp, msg, status, reason):
267        self.fp = fp
268        self.msg = msg
269        self.status = status
270        self.reason = reason
271    def read(self):
272        return ''
273
274class MockHTTPClass:
275    def __init__(self):
276        self.req_headers = []
277        self.data = None
278        self.raise_on_endheaders = False
279        self._tunnel_headers = {}
280
281    def __call__(self, host, timeout=socket._GLOBAL_DEFAULT_TIMEOUT):
282        self.host = host
283        self.timeout = timeout
284        return self
285
286    def set_debuglevel(self, level):
287        self.level = level
288
289    def set_tunnel(self, host, port=None, headers=None):
290        self._tunnel_host = host
291        self._tunnel_port = port
292        if headers:
293            self._tunnel_headers = headers
294        else:
295            self._tunnel_headers.clear()
296    def request(self, method, url, body=None, headers=None):
297        self.method = method
298        self.selector = url
299        if headers is not None:
300            self.req_headers += headers.items()
301        self.req_headers.sort()
302        if body:
303            self.data = body
304        if self.raise_on_endheaders:
305            import socket
306            raise socket.error()
307    def getresponse(self):
308        return MockHTTPResponse(MockFile(), {}, 200, "OK")
309
310class MockHandler:
311    # useful for testing handler machinery
312    # see add_ordered_mock_handlers() docstring
313    handler_order = 500
314    def __init__(self, methods):
315        self._define_methods(methods)
316    def _define_methods(self, methods):
317        for spec in methods:
318            if len(spec) == 2: name, action = spec
319            else: name, action = spec, None
320            meth = FakeMethod(name, action, self.handle)
321            setattr(self.__class__, name, meth)
322    def handle(self, fn_name, action, *args, **kwds):
323        self.parent.calls.append((self, fn_name, args, kwds))
324        if action is None:
325            return None
326        elif action == "return self":
327            return self
328        elif action == "return response":
329            res = MockResponse(200, "OK", {}, "")
330            return res
331        elif action == "return request":
332            return Request("http://blah/")
333        elif action.startswith("error"):
334            code = action[action.rfind(" ")+1:]
335            try:
336                code = int(code)
337            except ValueError:
338                pass
339            res = MockResponse(200, "OK", {}, "")
340            return self.parent.error("http", args[0], res, code, "", {})
341        elif action == "raise":
342            raise urllib2.URLError("blah")
343        assert False
344    def close(self): pass
345    def add_parent(self, parent):
346        self.parent = parent
347        self.parent.calls = []
348    def __lt__(self, other):
349        if not hasattr(other, "handler_order"):
350            # No handler_order, leave in original order.  Yuck.
351            return True
352        return self.handler_order < other.handler_order
353
354def add_ordered_mock_handlers(opener, meth_spec):
355    """Create MockHandlers and add them to an OpenerDirector.
356
357    meth_spec: list of lists of tuples and strings defining methods to define
358    on handlers.  eg:
359
360    [["http_error", "ftp_open"], ["http_open"]]
361
362    defines methods .http_error() and .ftp_open() on one handler, and
363    .http_open() on another.  These methods just record their arguments and
364    return None.  Using a tuple instead of a string causes the method to
365    perform some action (see MockHandler.handle()), eg:
366
367    [["http_error"], [("http_open", "return request")]]
368
369    defines .http_error() on one handler (which simply returns None), and
370    .http_open() on another handler, which returns a Request object.
371
372    """
373    handlers = []
374    count = 0
375    for meths in meth_spec:
376        class MockHandlerSubclass(MockHandler): pass
377        h = MockHandlerSubclass(meths)
378        h.handler_order += count
379        h.add_parent(opener)
380        count = count + 1
381        handlers.append(h)
382        opener.add_handler(h)
383    return handlers
384
385def build_test_opener(*handler_instances):
386    opener = OpenerDirector()
387    for h in handler_instances:
388        opener.add_handler(h)
389    return opener
390
391class MockHTTPHandler(urllib2.BaseHandler):
392    # useful for testing redirections and auth
393    # sends supplied headers and code as first response
394    # sends 200 OK as second response
395    def __init__(self, code, headers):
396        self.code = code
397        self.headers = headers
398        self.reset()
399    def reset(self):
400        self._count = 0
401        self.requests = []
402    def http_open(self, req):
403        import mimetools, httplib, copy
404        from StringIO import StringIO
405        self.requests.append(copy.deepcopy(req))
406        if self._count == 0:
407            self._count = self._count + 1
408            name = httplib.responses[self.code]
409            msg = mimetools.Message(StringIO(self.headers))
410            return self.parent.error(
411                "http", req, MockFile(), self.code, name, msg)
412        else:
413            self.req = req
414            msg = mimetools.Message(StringIO("\r\n\r\n"))
415            return MockResponse(200, "OK", msg, "", req.get_full_url())
416
417class MockHTTPSHandler(urllib2.AbstractHTTPHandler):
418    # Useful for testing the Proxy-Authorization request by verifying the
419    # properties of httpcon
420
421    def __init__(self):
422        urllib2.AbstractHTTPHandler.__init__(self)
423        self.httpconn = MockHTTPClass()
424
425    def https_open(self, req):
426        return self.do_open(self.httpconn, req)
427
428class MockPasswordManager:
429    def add_password(self, realm, uri, user, password):
430        self.realm = realm
431        self.url = uri
432        self.user = user
433        self.password = password
434    def find_user_password(self, realm, authuri):
435        self.target_realm = realm
436        self.target_url = authuri
437        return self.user, self.password
438
439
440class OpenerDirectorTests(unittest.TestCase):
441
442    def test_add_non_handler(self):
443        class NonHandler(object):
444            pass
445        self.assertRaises(TypeError,
446                          OpenerDirector().add_handler, NonHandler())
447
448    def test_badly_named_methods(self):
449        # test work-around for three methods that accidentally follow the
450        # naming conventions for handler methods
451        # (*_open() / *_request() / *_response())
452
453        # These used to call the accidentally-named methods, causing a
454        # TypeError in real code; here, returning self from these mock
455        # methods would either cause no exception, or AttributeError.
456
457        from urllib2 import URLError
458
459        o = OpenerDirector()
460        meth_spec = [
461            [("do_open", "return self"), ("proxy_open", "return self")],
462            [("redirect_request", "return self")],
463            ]
464        handlers = add_ordered_mock_handlers(o, meth_spec)
465        o.add_handler(urllib2.UnknownHandler())
466        for scheme in "do", "proxy", "redirect":
467            self.assertRaises(URLError, o.open, scheme+"://example.com/")
468
469    def test_handled(self):
470        # handler returning non-None means no more handlers will be called
471        o = OpenerDirector()
472        meth_spec = [
473            ["http_open", "ftp_open", "http_error_302"],
474            ["ftp_open"],
475            [("http_open", "return self")],
476            [("http_open", "return self")],
477            ]
478        handlers = add_ordered_mock_handlers(o, meth_spec)
479
480        req = Request("http://example.com/")
481        r = o.open(req)
482        # Second .http_open() gets called, third doesn't, since second returned
483        # non-None.  Handlers without .http_open() never get any methods called
484        # on them.
485        # In fact, second mock handler defining .http_open() returns self
486        # (instead of response), which becomes the OpenerDirector's return
487        # value.
488        self.assertEqual(r, handlers[2])
489        calls = [(handlers[0], "http_open"), (handlers[2], "http_open")]
490        for expected, got in zip(calls, o.calls):
491            handler, name, args, kwds = got
492            self.assertEqual((handler, name), expected)
493            self.assertEqual(args, (req,))
494
495    def test_handler_order(self):
496        o = OpenerDirector()
497        handlers = []
498        for meths, handler_order in [
499            ([("http_open", "return self")], 500),
500            (["http_open"], 0),
501            ]:
502            class MockHandlerSubclass(MockHandler): pass
503            h = MockHandlerSubclass(meths)
504            h.handler_order = handler_order
505            handlers.append(h)
506            o.add_handler(h)
507
508        r = o.open("http://example.com/")
509        # handlers called in reverse order, thanks to their sort order
510        self.assertEqual(o.calls[0][0], handlers[1])
511        self.assertEqual(o.calls[1][0], handlers[0])
512
513    def test_raise(self):
514        # raising URLError stops processing of request
515        o = OpenerDirector()
516        meth_spec = [
517            [("http_open", "raise")],
518            [("http_open", "return self")],
519            ]
520        handlers = add_ordered_mock_handlers(o, meth_spec)
521
522        req = Request("http://example.com/")
523        self.assertRaises(urllib2.URLError, o.open, req)
524        self.assertEqual(o.calls, [(handlers[0], "http_open", (req,), {})])
525
526##     def test_error(self):
527##         # XXX this doesn't actually seem to be used in standard library,
528##         #  but should really be tested anyway...
529
530    def test_http_error(self):
531        # XXX http_error_default
532        # http errors are a special case
533        o = OpenerDirector()
534        meth_spec = [
535            [("http_open", "error 302")],
536            [("http_error_400", "raise"), "http_open"],
537            [("http_error_302", "return response"), "http_error_303",
538             "http_error"],
539            [("http_error_302")],
540            ]
541        handlers = add_ordered_mock_handlers(o, meth_spec)
542
543        class Unknown:
544            def __eq__(self, other): return True
545
546        req = Request("http://example.com/")
547        r = o.open(req)
548        assert len(o.calls) == 2
549        calls = [(handlers[0], "http_open", (req,)),
550                 (handlers[2], "http_error_302",
551                  (req, Unknown(), 302, "", {}))]
552        for expected, got in zip(calls, o.calls):
553            handler, method_name, args = expected
554            self.assertEqual((handler, method_name), got[:2])
555            self.assertEqual(args, got[2])
556
557    def test_processors(self):
558        # *_request / *_response methods get called appropriately
559        o = OpenerDirector()
560        meth_spec = [
561            [("http_request", "return request"),
562             ("http_response", "return response")],
563            [("http_request", "return request"),
564             ("http_response", "return response")],
565            ]
566        handlers = add_ordered_mock_handlers(o, meth_spec)
567
568        req = Request("http://example.com/")
569        r = o.open(req)
570        # processor methods are called on *all* handlers that define them,
571        # not just the first handler that handles the request
572        calls = [
573            (handlers[0], "http_request"), (handlers[1], "http_request"),
574            (handlers[0], "http_response"), (handlers[1], "http_response")]
575
576        for i, (handler, name, args, kwds) in enumerate(o.calls):
577            if i < 2:
578                # *_request
579                self.assertEqual((handler, name), calls[i])
580                self.assertEqual(len(args), 1)
581                self.assertIsInstance(args[0], Request)
582            else:
583                # *_response
584                self.assertEqual((handler, name), calls[i])
585                self.assertEqual(len(args), 2)
586                self.assertIsInstance(args[0], Request)
587                # response from opener.open is None, because there's no
588                # handler that defines http_open to handle it
589                self.assertTrue(args[1] is None or
590                             isinstance(args[1], MockResponse))
591
592
593def sanepathname2url(path):
594    import urllib
595    urlpath = urllib.pathname2url(path)
596    if os.name == "nt" and urlpath.startswith("///"):
597        urlpath = urlpath[2:]
598    # XXX don't ask me about the mac...
599    return urlpath
600
601class HandlerTests(unittest.TestCase):
602
603    def test_ftp(self):
604        class MockFTPWrapper:
605            def __init__(self, data): self.data = data
606            def retrfile(self, filename, filetype):
607                self.filename, self.filetype = filename, filetype
608                return StringIO.StringIO(self.data), len(self.data)
609
610        class NullFTPHandler(urllib2.FTPHandler):
611            def __init__(self, data): self.data = data
612            def connect_ftp(self, user, passwd, host, port, dirs,
613                            timeout=socket._GLOBAL_DEFAULT_TIMEOUT):
614                self.user, self.passwd = user, passwd
615                self.host, self.port = host, port
616                self.dirs = dirs
617                self.ftpwrapper = MockFTPWrapper(self.data)
618                return self.ftpwrapper
619
620        import ftplib
621        data = "rheum rhaponicum"
622        h = NullFTPHandler(data)
623        o = h.parent = MockOpener()
624
625        for url, host, port, user, passwd, type_, dirs, filename, mimetype in [
626            ("ftp://localhost/foo/bar/baz.html",
627             "localhost", ftplib.FTP_PORT, "", "", "I",
628             ["foo", "bar"], "baz.html", "text/html"),
629            ("ftp://parrot@localhost/foo/bar/baz.html",
630             "localhost", ftplib.FTP_PORT, "parrot", "", "I",
631             ["foo", "bar"], "baz.html", "text/html"),
632            ("ftp://%25parrot@localhost/foo/bar/baz.html",
633             "localhost", ftplib.FTP_PORT, "%parrot", "", "I",
634             ["foo", "bar"], "baz.html", "text/html"),
635            ("ftp://%2542parrot@localhost/foo/bar/baz.html",
636             "localhost", ftplib.FTP_PORT, "%42parrot", "", "I",
637             ["foo", "bar"], "baz.html", "text/html"),
638            ("ftp://localhost:80/foo/bar/",
639             "localhost", 80, "", "", "D",
640             ["foo", "bar"], "", None),
641            ("ftp://localhost/baz.gif;type=a",
642             "localhost", ftplib.FTP_PORT, "", "", "A",
643             [], "baz.gif", None),  # XXX really this should guess image/gif
644            ]:
645            req = Request(url)
646            req.timeout = None
647            r = h.ftp_open(req)
648            # ftp authentication not yet implemented by FTPHandler
649            self.assertEqual(h.user, user)
650            self.assertEqual(h.passwd, passwd)
651            self.assertEqual(h.host, socket.gethostbyname(host))
652            self.assertEqual(h.port, port)
653            self.assertEqual(h.dirs, dirs)
654            self.assertEqual(h.ftpwrapper.filename, filename)
655            self.assertEqual(h.ftpwrapper.filetype, type_)
656            headers = r.info()
657            self.assertEqual(headers.get("Content-type"), mimetype)
658            self.assertEqual(int(headers["Content-length"]), len(data))
659
660    def test_file(self):
661        import rfc822, socket
662        h = urllib2.FileHandler()
663        o = h.parent = MockOpener()
664
665        TESTFN = test_support.TESTFN
666        urlpath = sanepathname2url(os.path.abspath(TESTFN))
667        towrite = "hello, world\n"
668        urls = [
669            "file://localhost%s" % urlpath,
670            "file://%s" % urlpath,
671            "file://%s%s" % (socket.gethostbyname('localhost'), urlpath),
672            ]
673        try:
674            localaddr = socket.gethostbyname(socket.gethostname())
675        except socket.gaierror:
676            localaddr = ''
677        if localaddr:
678            urls.append("file://%s%s" % (localaddr, urlpath))
679
680        for url in urls:
681            f = open(TESTFN, "wb")
682            try:
683                try:
684                    f.write(towrite)
685                finally:
686                    f.close()
687
688                r = h.file_open(Request(url))
689                try:
690                    data = r.read()
691                    headers = r.info()
692                    respurl = r.geturl()
693                finally:
694                    r.close()
695                stats = os.stat(TESTFN)
696                modified = rfc822.formatdate(stats.st_mtime)
697            finally:
698                os.remove(TESTFN)
699            self.assertEqual(data, towrite)
700            self.assertEqual(headers["Content-type"], "text/plain")
701            self.assertEqual(headers["Content-length"], "13")
702            self.assertEqual(headers["Last-modified"], modified)
703            self.assertEqual(respurl, url)
704
705        for url in [
706            "file://localhost:80%s" % urlpath,
707            "file:///file_does_not_exist.txt",
708            "file://%s:80%s/%s" % (socket.gethostbyname('localhost'),
709                                   os.getcwd(), TESTFN),
710            "file://somerandomhost.ontheinternet.com%s/%s" %
711            (os.getcwd(), TESTFN),
712            ]:
713            try:
714                f = open(TESTFN, "wb")
715                try:
716                    f.write(towrite)
717                finally:
718                    f.close()
719
720                self.assertRaises(urllib2.URLError,
721                                  h.file_open, Request(url))
722            finally:
723                os.remove(TESTFN)
724
725        h = urllib2.FileHandler()
726        o = h.parent = MockOpener()
727        # XXXX why does // mean ftp (and /// mean not ftp!), and where
728        #  is file: scheme specified?  I think this is really a bug, and
729        #  what was intended was to distinguish between URLs like:
730        # file:/blah.txt (a file)
731        # file://localhost/blah.txt (a file)
732        # file:///blah.txt (a file)
733        # file://ftp.example.com/blah.txt (an ftp URL)
734        for url, ftp in [
735            ("file://ftp.example.com//foo.txt", True),
736            ("file://ftp.example.com///foo.txt", False),
737# XXXX bug: fails with OSError, should be URLError
738            ("file://ftp.example.com/foo.txt", False),
739            ("file://somehost//foo/something.txt", True),
740            ("file://localhost//foo/something.txt", False),
741            ]:
742            req = Request(url)
743            try:
744                h.file_open(req)
745            # XXXX remove OSError when bug fixed
746            except (urllib2.URLError, OSError):
747                self.assertTrue(not ftp)
748            else:
749                self.assertTrue(o.req is req)
750                self.assertEqual(req.type, "ftp")
751            self.assertEqual(req.type == "ftp", ftp)
752
753    def test_http(self):
754
755        h = urllib2.AbstractHTTPHandler()
756        o = h.parent = MockOpener()
757
758        url = "http://example.com/"
759        for method, data in [("GET", None), ("POST", "blah")]:
760            req = Request(url, data, {"Foo": "bar"})
761            req.timeout = None
762            req.add_unredirected_header("Spam", "eggs")
763            http = MockHTTPClass()
764            r = h.do_open(http, req)
765
766            # result attributes
767            r.read; r.readline  # wrapped MockFile methods
768            r.info; r.geturl  # addinfourl methods
769            r.code, r.msg == 200, "OK"  # added from MockHTTPClass.getreply()
770            hdrs = r.info()
771            hdrs.get; hdrs.has_key  # r.info() gives dict from .getreply()
772            self.assertEqual(r.geturl(), url)
773
774            self.assertEqual(http.host, "example.com")
775            self.assertEqual(http.level, 0)
776            self.assertEqual(http.method, method)
777            self.assertEqual(http.selector, "/")
778            self.assertEqual(http.req_headers,
779                             [("Connection", "close"),
780                              ("Foo", "bar"), ("Spam", "eggs")])
781            self.assertEqual(http.data, data)
782
783        # check socket.error converted to URLError
784        http.raise_on_endheaders = True
785        self.assertRaises(urllib2.URLError, h.do_open, http, req)
786
787        # check adding of standard headers
788        o.addheaders = [("Spam", "eggs")]
789        for data in "", None:  # POST, GET
790            req = Request("http://example.com/", data)
791            r = MockResponse(200, "OK", {}, "")
792            newreq = h.do_request_(req)
793            if data is None:  # GET
794                self.assertNotIn("Content-length", req.unredirected_hdrs)
795                self.assertNotIn("Content-type", req.unredirected_hdrs)
796            else:  # POST
797                self.assertEqual(req.unredirected_hdrs["Content-length"], "0")
798                self.assertEqual(req.unredirected_hdrs["Content-type"],
799                             "application/x-www-form-urlencoded")
800            # XXX the details of Host could be better tested
801            self.assertEqual(req.unredirected_hdrs["Host"], "example.com")
802            self.assertEqual(req.unredirected_hdrs["Spam"], "eggs")
803
804            # don't clobber existing headers
805            req.add_unredirected_header("Content-length", "foo")
806            req.add_unredirected_header("Content-type", "bar")
807            req.add_unredirected_header("Host", "baz")
808            req.add_unredirected_header("Spam", "foo")
809            newreq = h.do_request_(req)
810            self.assertEqual(req.unredirected_hdrs["Content-length"], "foo")
811            self.assertEqual(req.unredirected_hdrs["Content-type"], "bar")
812            self.assertEqual(req.unredirected_hdrs["Host"], "baz")
813            self.assertEqual(req.unredirected_hdrs["Spam"], "foo")
814
815    def test_http_doubleslash(self):
816        # Checks that the presence of an unnecessary double slash in a url doesn't break anything
817        # Previously, a double slash directly after the host could cause incorrect parsing of the url
818        h = urllib2.AbstractHTTPHandler()
819        o = h.parent = MockOpener()
820
821        data = ""
822        ds_urls = [
823            "http://example.com/foo/bar/baz.html",
824            "http://example.com//foo/bar/baz.html",
825            "http://example.com/foo//bar/baz.html",
826            "http://example.com/foo/bar//baz.html",
827        ]
828
829        for ds_url in ds_urls:
830            ds_req = Request(ds_url, data)
831
832            # Check whether host is determined correctly if there is no proxy
833            np_ds_req = h.do_request_(ds_req)
834            self.assertEqual(np_ds_req.unredirected_hdrs["Host"],"example.com")
835
836            # Check whether host is determined correctly if there is a proxy
837            ds_req.set_proxy("someproxy:3128",None)
838            p_ds_req = h.do_request_(ds_req)
839            self.assertEqual(p_ds_req.unredirected_hdrs["Host"],"example.com")
840
841    def test_fixpath_in_weirdurls(self):
842        # Issue4493: urllib2 to supply '/' when to urls where path does not
843        # start with'/'
844
845        h = urllib2.AbstractHTTPHandler()
846        o = h.parent = MockOpener()
847
848        weird_url = 'http://www.python.org?getspam'
849        req = Request(weird_url)
850        newreq = h.do_request_(req)
851        self.assertEqual(newreq.get_host(),'www.python.org')
852        self.assertEqual(newreq.get_selector(),'/?getspam')
853
854        url_without_path = 'http://www.python.org'
855        req = Request(url_without_path)
856        newreq = h.do_request_(req)
857        self.assertEqual(newreq.get_host(),'www.python.org')
858        self.assertEqual(newreq.get_selector(),'')
859
860    def test_errors(self):
861        h = urllib2.HTTPErrorProcessor()
862        o = h.parent = MockOpener()
863
864        url = "http://example.com/"
865        req = Request(url)
866        # all 2xx are passed through
867        r = MockResponse(200, "OK", {}, "", url)
868        newr = h.http_response(req, r)
869        self.assertTrue(r is newr)
870        self.assertTrue(not hasattr(o, "proto"))  # o.error not called
871        r = MockResponse(202, "Accepted", {}, "", url)
872        newr = h.http_response(req, r)
873        self.assertTrue(r is newr)
874        self.assertTrue(not hasattr(o, "proto"))  # o.error not called
875        r = MockResponse(206, "Partial content", {}, "", url)
876        newr = h.http_response(req, r)
877        self.assertTrue(r is newr)
878        self.assertTrue(not hasattr(o, "proto"))  # o.error not called
879        # anything else calls o.error (and MockOpener returns None, here)
880        r = MockResponse(502, "Bad gateway", {}, "", url)
881        self.assertTrue(h.http_response(req, r) is None)
882        self.assertEqual(o.proto, "http")  # o.error called
883        self.assertEqual(o.args, (req, r, 502, "Bad gateway", {}))
884
885    def test_cookies(self):
886        cj = MockCookieJar()
887        h = urllib2.HTTPCookieProcessor(cj)
888        o = h.parent = MockOpener()
889
890        req = Request("http://example.com/")
891        r = MockResponse(200, "OK", {}, "")
892        newreq = h.http_request(req)
893        self.assertTrue(cj.ach_req is req is newreq)
894        self.assertEqual(req.get_origin_req_host(), "example.com")
895        self.assertTrue(not req.is_unverifiable())
896        newr = h.http_response(req, r)
897        self.assertTrue(cj.ec_req is req)
898        self.assertTrue(cj.ec_r is r is newr)
899
900    def test_redirect(self):
901        from_url = "http://example.com/a.html"
902        to_url = "http://example.com/b.html"
903        h = urllib2.HTTPRedirectHandler()
904        o = h.parent = MockOpener()
905
906        # ordinary redirect behaviour
907        for code in 301, 302, 303, 307:
908            for data in None, "blah\nblah\n":
909                method = getattr(h, "http_error_%s" % code)
910                req = Request(from_url, data)
911                req.add_header("Nonsense", "viking=withhold")
912                req.timeout = socket._GLOBAL_DEFAULT_TIMEOUT
913                if data is not None:
914                    req.add_header("Content-Length", str(len(data)))
915                req.add_unredirected_header("Spam", "spam")
916                try:
917                    method(req, MockFile(), code, "Blah",
918                           MockHeaders({"location": to_url}))
919                except urllib2.HTTPError:
920                    # 307 in response to POST requires user OK
921                    self.assertTrue(code == 307 and data is not None)
922                self.assertEqual(o.req.get_full_url(), to_url)
923                try:
924                    self.assertEqual(o.req.get_method(), "GET")
925                except AttributeError:
926                    self.assertTrue(not o.req.has_data())
927
928                # now it's a GET, there should not be headers regarding content
929                # (possibly dragged from before being a POST)
930                headers = [x.lower() for x in o.req.headers]
931                self.assertNotIn("content-length", headers)
932                self.assertNotIn("content-type", headers)
933
934                self.assertEqual(o.req.headers["Nonsense"],
935                                 "viking=withhold")
936                self.assertNotIn("Spam", o.req.headers)
937                self.assertNotIn("Spam", o.req.unredirected_hdrs)
938
939        # loop detection
940        req = Request(from_url)
941        req.timeout = socket._GLOBAL_DEFAULT_TIMEOUT
942        def redirect(h, req, url=to_url):
943            h.http_error_302(req, MockFile(), 302, "Blah",
944                             MockHeaders({"location": url}))
945        # Note that the *original* request shares the same record of
946        # redirections with the sub-requests caused by the redirections.
947
948        # detect infinite loop redirect of a URL to itself
949        req = Request(from_url, origin_req_host="example.com")
950        count = 0
951        req.timeout = socket._GLOBAL_DEFAULT_TIMEOUT
952        try:
953            while 1:
954                redirect(h, req, "http://example.com/")
955                count = count + 1
956        except urllib2.HTTPError:
957            # don't stop until max_repeats, because cookies may introduce state
958            self.assertEqual(count, urllib2.HTTPRedirectHandler.max_repeats)
959
960        # detect endless non-repeating chain of redirects
961        req = Request(from_url, origin_req_host="example.com")
962        count = 0
963        req.timeout = socket._GLOBAL_DEFAULT_TIMEOUT
964        try:
965            while 1:
966                redirect(h, req, "http://example.com/%d" % count)
967                count = count + 1
968        except urllib2.HTTPError:
969            self.assertEqual(count,
970                             urllib2.HTTPRedirectHandler.max_redirections)
971
972    def test_invalid_redirect(self):
973        from_url = "http://example.com/a.html"
974        valid_schemes = ['http', 'https', 'ftp']
975        invalid_schemes = ['file', 'imap', 'ldap']
976        schemeless_url = "example.com/b.html"
977        h = urllib2.HTTPRedirectHandler()
978        o = h.parent = MockOpener()
979        req = Request(from_url)
980        req.timeout = socket._GLOBAL_DEFAULT_TIMEOUT
981
982        for scheme in invalid_schemes:
983            invalid_url = scheme + '://' + schemeless_url
984            self.assertRaises(urllib2.HTTPError, h.http_error_302,
985                              req, MockFile(), 302, "Security Loophole",
986                              MockHeaders({"location": invalid_url}))
987
988        for scheme in valid_schemes:
989            valid_url = scheme + '://' + schemeless_url
990            h.http_error_302(req, MockFile(), 302, "That's fine",
991                MockHeaders({"location": valid_url}))
992            self.assertEqual(o.req.get_full_url(), valid_url)
993
994    def test_cookie_redirect(self):
995        # cookies shouldn't leak into redirected requests
996        from cookielib import CookieJar
997
998        from test.test_cookielib import interact_netscape
999
1000        cj = CookieJar()
1001        interact_netscape(cj, "http://www.example.com/", "spam=eggs")
1002        hh = MockHTTPHandler(302, "Location: http://www.cracker.com/\r\n\r\n")
1003        hdeh = urllib2.HTTPDefaultErrorHandler()
1004        hrh = urllib2.HTTPRedirectHandler()
1005        cp = urllib2.HTTPCookieProcessor(cj)
1006        o = build_test_opener(hh, hdeh, hrh, cp)
1007        o.open("http://www.example.com/")
1008        self.assertTrue(not hh.req.has_header("Cookie"))
1009
1010    def test_redirect_fragment(self):
1011        redirected_url = 'http://www.example.com/index.html#OK\r\n\r\n'
1012        hh = MockHTTPHandler(302, 'Location: ' + redirected_url)
1013        hdeh = urllib2.HTTPDefaultErrorHandler()
1014        hrh = urllib2.HTTPRedirectHandler()
1015        o = build_test_opener(hh, hdeh, hrh)
1016        fp = o.open('http://www.example.com')
1017        self.assertEqual(fp.geturl(), redirected_url.strip())
1018
1019    def test_proxy(self):
1020        o = OpenerDirector()
1021        ph = urllib2.ProxyHandler(dict(http="proxy.example.com:3128"))
1022        o.add_handler(ph)
1023        meth_spec = [
1024            [("http_open", "return response")]
1025            ]
1026        handlers = add_ordered_mock_handlers(o, meth_spec)
1027
1028        req = Request("http://acme.example.com/")
1029        self.assertEqual(req.get_host(), "acme.example.com")
1030        r = o.open(req)
1031        self.assertEqual(req.get_host(), "proxy.example.com:3128")
1032
1033        self.assertEqual([(handlers[0], "http_open")],
1034                         [tup[0:2] for tup in o.calls])
1035
1036    def test_proxy_no_proxy(self):
1037        os.environ['no_proxy'] = 'python.org'
1038        o = OpenerDirector()
1039        ph = urllib2.ProxyHandler(dict(http="proxy.example.com"))
1040        o.add_handler(ph)
1041        req = Request("http://www.perl.org/")
1042        self.assertEqual(req.get_host(), "www.perl.org")
1043        r = o.open(req)
1044        self.assertEqual(req.get_host(), "proxy.example.com")
1045        req = Request("http://www.python.org")
1046        self.assertEqual(req.get_host(), "www.python.org")
1047        r = o.open(req)
1048        self.assertEqual(req.get_host(), "www.python.org")
1049        del os.environ['no_proxy']
1050
1051
1052    def test_proxy_https(self):
1053        o = OpenerDirector()
1054        ph = urllib2.ProxyHandler(dict(https='proxy.example.com:3128'))
1055        o.add_handler(ph)
1056        meth_spec = [
1057            [("https_open","return response")]
1058        ]
1059        handlers = add_ordered_mock_handlers(o, meth_spec)
1060        req = Request("https://www.example.com/")
1061        self.assertEqual(req.get_host(), "www.example.com")
1062        r = o.open(req)
1063        self.assertEqual(req.get_host(), "proxy.example.com:3128")
1064        self.assertEqual([(handlers[0], "https_open")],
1065                         [tup[0:2] for tup in o.calls])
1066
1067    def test_proxy_https_proxy_authorization(self):
1068        o = OpenerDirector()
1069        ph = urllib2.ProxyHandler(dict(https='proxy.example.com:3128'))
1070        o.add_handler(ph)
1071        https_handler = MockHTTPSHandler()
1072        o.add_handler(https_handler)
1073        req = Request("https://www.example.com/")
1074        req.add_header("Proxy-Authorization","FooBar")
1075        req.add_header("User-Agent","Grail")
1076        self.assertEqual(req.get_host(), "www.example.com")
1077        self.assertIsNone(req._tunnel_host)
1078        r = o.open(req)
1079        # Verify Proxy-Authorization gets tunneled to request.
1080        # httpsconn req_headers do not have the Proxy-Authorization header but
1081        # the req will have.
1082        self.assertNotIn(("Proxy-Authorization","FooBar"),
1083                         https_handler.httpconn.req_headers)
1084        self.assertIn(("User-Agent","Grail"),
1085                      https_handler.httpconn.req_headers)
1086        self.assertIsNotNone(req._tunnel_host)
1087        self.assertEqual(req.get_host(), "proxy.example.com:3128")
1088        self.assertEqual(req.get_header("Proxy-authorization"),"FooBar")
1089
1090    def test_basic_auth(self, quote_char='"'):
1091        opener = OpenerDirector()
1092        password_manager = MockPasswordManager()
1093        auth_handler = urllib2.HTTPBasicAuthHandler(password_manager)
1094        realm = "ACME Widget Store"
1095        http_handler = MockHTTPHandler(
1096            401, 'WWW-Authenticate: Basic realm=%s%s%s\r\n\r\n' %
1097            (quote_char, realm, quote_char) )
1098        opener.add_handler(auth_handler)
1099        opener.add_handler(http_handler)
1100        self._test_basic_auth(opener, auth_handler, "Authorization",
1101                              realm, http_handler, password_manager,
1102                              "http://acme.example.com/protected",
1103                              "http://acme.example.com/protected",
1104                              )
1105
1106    def test_basic_auth_with_single_quoted_realm(self):
1107        self.test_basic_auth(quote_char="'")
1108
1109    def test_proxy_basic_auth(self):
1110        opener = OpenerDirector()
1111        ph = urllib2.ProxyHandler(dict(http="proxy.example.com:3128"))
1112        opener.add_handler(ph)
1113        password_manager = MockPasswordManager()
1114        auth_handler = urllib2.ProxyBasicAuthHandler(password_manager)
1115        realm = "ACME Networks"
1116        http_handler = MockHTTPHandler(
1117            407, 'Proxy-Authenticate: Basic realm="%s"\r\n\r\n' % realm)
1118        opener.add_handler(auth_handler)
1119        opener.add_handler(http_handler)
1120        self._test_basic_auth(opener, auth_handler, "Proxy-authorization",
1121                              realm, http_handler, password_manager,
1122                              "http://acme.example.com:3128/protected",
1123                              "proxy.example.com:3128",
1124                              )
1125
1126    def test_basic_and_digest_auth_handlers(self):
1127        # HTTPDigestAuthHandler threw an exception if it couldn't handle a 40*
1128        # response (http://python.org/sf/1479302), where it should instead
1129        # return None to allow another handler (especially
1130        # HTTPBasicAuthHandler) to handle the response.
1131
1132        # Also (http://python.org/sf/14797027, RFC 2617 section 1.2), we must
1133        # try digest first (since it's the strongest auth scheme), so we record
1134        # order of calls here to check digest comes first:
1135        class RecordingOpenerDirector(OpenerDirector):
1136            def __init__(self):
1137                OpenerDirector.__init__(self)
1138                self.recorded = []
1139            def record(self, info):
1140                self.recorded.append(info)
1141        class TestDigestAuthHandler(urllib2.HTTPDigestAuthHandler):
1142            def http_error_401(self, *args, **kwds):
1143                self.parent.record("digest")
1144                urllib2.HTTPDigestAuthHandler.http_error_401(self,
1145                                                             *args, **kwds)
1146        class TestBasicAuthHandler(urllib2.HTTPBasicAuthHandler):
1147            def http_error_401(self, *args, **kwds):
1148                self.parent.record("basic")
1149                urllib2.HTTPBasicAuthHandler.http_error_401(self,
1150                                                            *args, **kwds)
1151
1152        opener = RecordingOpenerDirector()
1153        password_manager = MockPasswordManager()
1154        digest_handler = TestDigestAuthHandler(password_manager)
1155        basic_handler = TestBasicAuthHandler(password_manager)
1156        realm = "ACME Networks"
1157        http_handler = MockHTTPHandler(
1158            401, 'WWW-Authenticate: Basic realm="%s"\r\n\r\n' % realm)
1159        opener.add_handler(basic_handler)
1160        opener.add_handler(digest_handler)
1161        opener.add_handler(http_handler)
1162
1163        # check basic auth isn't blocked by digest handler failing
1164        self._test_basic_auth(opener, basic_handler, "Authorization",
1165                              realm, http_handler, password_manager,
1166                              "http://acme.example.com/protected",
1167                              "http://acme.example.com/protected",
1168                              )
1169        # check digest was tried before basic (twice, because
1170        # _test_basic_auth called .open() twice)
1171        self.assertEqual(opener.recorded, ["digest", "basic"]*2)
1172
1173    def _test_basic_auth(self, opener, auth_handler, auth_header,
1174                         realm, http_handler, password_manager,
1175                         request_url, protected_url):
1176        import base64
1177        user, password = "wile", "coyote"
1178
1179        # .add_password() fed through to password manager
1180        auth_handler.add_password(realm, request_url, user, password)
1181        self.assertEqual(realm, password_manager.realm)
1182        self.assertEqual(request_url, password_manager.url)
1183        self.assertEqual(user, password_manager.user)
1184        self.assertEqual(password, password_manager.password)
1185
1186        r = opener.open(request_url)
1187
1188        # should have asked the password manager for the username/password
1189        self.assertEqual(password_manager.target_realm, realm)
1190        self.assertEqual(password_manager.target_url, protected_url)
1191
1192        # expect one request without authorization, then one with
1193        self.assertEqual(len(http_handler.requests), 2)
1194        self.assertFalse(http_handler.requests[0].has_header(auth_header))
1195        userpass = '%s:%s' % (user, password)
1196        auth_hdr_value = 'Basic '+base64.encodestring(userpass).strip()
1197        self.assertEqual(http_handler.requests[1].get_header(auth_header),
1198                         auth_hdr_value)
1199        self.assertEqual(http_handler.requests[1].unredirected_hdrs[auth_header],
1200                         auth_hdr_value)
1201        # if the password manager can't find a password, the handler won't
1202        # handle the HTTP auth error
1203        password_manager.user = password_manager.password = None
1204        http_handler.reset()
1205        r = opener.open(request_url)
1206        self.assertEqual(len(http_handler.requests), 1)
1207        self.assertFalse(http_handler.requests[0].has_header(auth_header))
1208
1209class MiscTests(unittest.TestCase):
1210
1211    def test_build_opener(self):
1212        class MyHTTPHandler(urllib2.HTTPHandler): pass
1213        class FooHandler(urllib2.BaseHandler):
1214            def foo_open(self): pass
1215        class BarHandler(urllib2.BaseHandler):
1216            def bar_open(self): pass
1217
1218        build_opener = urllib2.build_opener
1219
1220        o = build_opener(FooHandler, BarHandler)
1221        self.opener_has_handler(o, FooHandler)
1222        self.opener_has_handler(o, BarHandler)
1223
1224        # can take a mix of classes and instances
1225        o = build_opener(FooHandler, BarHandler())
1226        self.opener_has_handler(o, FooHandler)
1227        self.opener_has_handler(o, BarHandler)
1228
1229        # subclasses of default handlers override default handlers
1230        o = build_opener(MyHTTPHandler)
1231        self.opener_has_handler(o, MyHTTPHandler)
1232
1233        # a particular case of overriding: default handlers can be passed
1234        # in explicitly
1235        o = build_opener()
1236        self.opener_has_handler(o, urllib2.HTTPHandler)
1237        o = build_opener(urllib2.HTTPHandler)
1238        self.opener_has_handler(o, urllib2.HTTPHandler)
1239        o = build_opener(urllib2.HTTPHandler())
1240        self.opener_has_handler(o, urllib2.HTTPHandler)
1241
1242        # Issue2670: multiple handlers sharing the same base class
1243        class MyOtherHTTPHandler(urllib2.HTTPHandler): pass
1244        o = build_opener(MyHTTPHandler, MyOtherHTTPHandler)
1245        self.opener_has_handler(o, MyHTTPHandler)
1246        self.opener_has_handler(o, MyOtherHTTPHandler)
1247
1248    def opener_has_handler(self, opener, handler_class):
1249        for h in opener.handlers:
1250            if h.__class__ == handler_class:
1251                break
1252        else:
1253            self.assertTrue(False)
1254
1255class RequestTests(unittest.TestCase):
1256
1257    def setUp(self):
1258        self.get = urllib2.Request("http://www.python.org/~jeremy/")
1259        self.post = urllib2.Request("http://www.python.org/~jeremy/",
1260                                    "data",
1261                                    headers={"X-Test": "test"})
1262
1263    def test_method(self):
1264        self.assertEqual("POST", self.post.get_method())
1265        self.assertEqual("GET", self.get.get_method())
1266
1267    def test_add_data(self):
1268        self.assertTrue(not self.get.has_data())
1269        self.assertEqual("GET", self.get.get_method())
1270        self.get.add_data("spam")
1271        self.assertTrue(self.get.has_data())
1272        self.assertEqual("POST", self.get.get_method())
1273
1274    def test_get_full_url(self):
1275        self.assertEqual("http://www.python.org/~jeremy/",
1276                         self.get.get_full_url())
1277
1278    def test_selector(self):
1279        self.assertEqual("/~jeremy/", self.get.get_selector())
1280        req = urllib2.Request("http://www.python.org/")
1281        self.assertEqual("/", req.get_selector())
1282
1283    def test_get_type(self):
1284        self.assertEqual("http", self.get.get_type())
1285
1286    def test_get_host(self):
1287        self.assertEqual("www.python.org", self.get.get_host())
1288
1289    def test_get_host_unquote(self):
1290        req = urllib2.Request("http://www.%70ython.org/")
1291        self.assertEqual("www.python.org", req.get_host())
1292
1293    def test_proxy(self):
1294        self.assertTrue(not self.get.has_proxy())
1295        self.get.set_proxy("www.perl.org", "http")
1296        self.assertTrue(self.get.has_proxy())
1297        self.assertEqual("www.python.org", self.get.get_origin_req_host())
1298        self.assertEqual("www.perl.org", self.get.get_host())
1299
1300    def test_wrapped_url(self):
1301        req = Request("<URL:http://www.python.org>")
1302        self.assertEqual("www.python.org", req.get_host())
1303
1304    def test_url_fragment(self):
1305        req = Request("http://www.python.org/?qs=query#fragment=true")
1306        self.assertEqual("/?qs=query", req.get_selector())
1307        req = Request("http://www.python.org/#fun=true")
1308        self.assertEqual("/", req.get_selector())
1309
1310        # Issue 11703: geturl() omits fragment in the original URL.
1311        url = 'http://docs.python.org/library/urllib2.html#OK'
1312        req = Request(url)
1313        self.assertEqual(req.get_full_url(), url)
1314
1315def test_main(verbose=None):
1316    from test import test_urllib2
1317    test_support.run_doctest(test_urllib2, verbose)
1318    test_support.run_doctest(urllib2, verbose)
1319    tests = (TrivialTests,
1320             OpenerDirectorTests,
1321             HandlerTests,
1322             MiscTests,
1323             RequestTests)
1324    test_support.run_unittest(*tests)
1325
1326if __name__ == "__main__":
1327    test_main(verbose=True)
1328