1"""Regression tests for what was in Python 2's "urllib" module""" 2 3import urllib.parse 4import urllib.request 5import urllib.error 6import http.client 7import email.message 8import io 9import unittest 10from unittest.mock import patch 11from test import support 12import os 13try: 14 import ssl 15except ImportError: 16 ssl = None 17import sys 18import tempfile 19from nturl2path import url2pathname, pathname2url 20 21from base64 import b64encode 22import collections 23 24 25def hexescape(char): 26 """Escape char as RFC 2396 specifies""" 27 hex_repr = hex(ord(char))[2:].upper() 28 if len(hex_repr) == 1: 29 hex_repr = "0%s" % hex_repr 30 return "%" + hex_repr 31 32# Shortcut for testing FancyURLopener 33_urlopener = None 34 35 36def urlopen(url, data=None, proxies=None): 37 """urlopen(url [, data]) -> open file-like object""" 38 global _urlopener 39 if proxies is not None: 40 opener = urllib.request.FancyURLopener(proxies=proxies) 41 elif not _urlopener: 42 opener = FancyURLopener() 43 _urlopener = opener 44 else: 45 opener = _urlopener 46 if data is None: 47 return opener.open(url) 48 else: 49 return opener.open(url, data) 50 51 52def FancyURLopener(): 53 with support.check_warnings( 54 ('FancyURLopener style of invoking requests is deprecated.', 55 DeprecationWarning)): 56 return urllib.request.FancyURLopener() 57 58 59def fakehttp(fakedata, mock_close=False): 60 class FakeSocket(io.BytesIO): 61 io_refs = 1 62 63 def sendall(self, data): 64 FakeHTTPConnection.buf = data 65 66 def makefile(self, *args, **kwds): 67 self.io_refs += 1 68 return self 69 70 def read(self, amt=None): 71 if self.closed: 72 return b"" 73 return io.BytesIO.read(self, amt) 74 75 def readline(self, length=None): 76 if self.closed: 77 return b"" 78 return io.BytesIO.readline(self, length) 79 80 def close(self): 81 self.io_refs -= 1 82 if self.io_refs == 0: 83 io.BytesIO.close(self) 84 85 class FakeHTTPConnection(http.client.HTTPConnection): 86 87 # buffer to store data for verification in urlopen tests. 88 buf = None 89 90 def connect(self): 91 self.sock = FakeSocket(self.fakedata) 92 type(self).fakesock = self.sock 93 94 if mock_close: 95 # bpo-36918: HTTPConnection destructor calls close() which calls 96 # flush(). Problem: flush() calls self.fp.flush() which raises 97 # "ValueError: I/O operation on closed file" which is logged as an 98 # "Exception ignored in". Override close() to silence this error. 99 def close(self): 100 pass 101 FakeHTTPConnection.fakedata = fakedata 102 103 return FakeHTTPConnection 104 105 106class FakeHTTPMixin(object): 107 def fakehttp(self, fakedata, mock_close=False): 108 fake_http_class = fakehttp(fakedata, mock_close=mock_close) 109 self._connection_class = http.client.HTTPConnection 110 http.client.HTTPConnection = fake_http_class 111 112 def unfakehttp(self): 113 http.client.HTTPConnection = self._connection_class 114 115 116class FakeFTPMixin(object): 117 def fakeftp(self): 118 class FakeFtpWrapper(object): 119 def __init__(self, user, passwd, host, port, dirs, timeout=None, 120 persistent=True): 121 pass 122 123 def retrfile(self, file, type): 124 return io.BytesIO(), 0 125 126 def close(self): 127 pass 128 129 self._ftpwrapper_class = urllib.request.ftpwrapper 130 urllib.request.ftpwrapper = FakeFtpWrapper 131 132 def unfakeftp(self): 133 urllib.request.ftpwrapper = self._ftpwrapper_class 134 135 136class urlopen_FileTests(unittest.TestCase): 137 """Test urlopen() opening a temporary file. 138 139 Try to test as much functionality as possible so as to cut down on reliance 140 on connecting to the Net for testing. 141 142 """ 143 144 def setUp(self): 145 # Create a temp file to use for testing 146 self.text = bytes("test_urllib: %s\n" % self.__class__.__name__, 147 "ascii") 148 f = open(support.TESTFN, 'wb') 149 try: 150 f.write(self.text) 151 finally: 152 f.close() 153 self.pathname = support.TESTFN 154 self.returned_obj = urlopen("file:%s" % self.pathname) 155 156 def tearDown(self): 157 """Shut down the open object""" 158 self.returned_obj.close() 159 os.remove(support.TESTFN) 160 161 def test_interface(self): 162 # Make sure object returned by urlopen() has the specified methods 163 for attr in ("read", "readline", "readlines", "fileno", 164 "close", "info", "geturl", "getcode", "__iter__"): 165 self.assertTrue(hasattr(self.returned_obj, attr), 166 "object returned by urlopen() lacks %s attribute" % 167 attr) 168 169 def test_read(self): 170 self.assertEqual(self.text, self.returned_obj.read()) 171 172 def test_readline(self): 173 self.assertEqual(self.text, self.returned_obj.readline()) 174 self.assertEqual(b'', self.returned_obj.readline(), 175 "calling readline() after exhausting the file did not" 176 " return an empty string") 177 178 def test_readlines(self): 179 lines_list = self.returned_obj.readlines() 180 self.assertEqual(len(lines_list), 1, 181 "readlines() returned the wrong number of lines") 182 self.assertEqual(lines_list[0], self.text, 183 "readlines() returned improper text") 184 185 def test_fileno(self): 186 file_num = self.returned_obj.fileno() 187 self.assertIsInstance(file_num, int, "fileno() did not return an int") 188 self.assertEqual(os.read(file_num, len(self.text)), self.text, 189 "Reading on the file descriptor returned by fileno() " 190 "did not return the expected text") 191 192 def test_close(self): 193 # Test close() by calling it here and then having it be called again 194 # by the tearDown() method for the test 195 self.returned_obj.close() 196 197 def test_info(self): 198 self.assertIsInstance(self.returned_obj.info(), email.message.Message) 199 200 def test_geturl(self): 201 self.assertEqual(self.returned_obj.geturl(), self.pathname) 202 203 def test_getcode(self): 204 self.assertIsNone(self.returned_obj.getcode()) 205 206 def test_iter(self): 207 # Test iterator 208 # Don't need to count number of iterations since test would fail the 209 # instant it returned anything beyond the first line from the 210 # comparison. 211 # Use the iterator in the usual implicit way to test for ticket #4608. 212 for line in self.returned_obj: 213 self.assertEqual(line, self.text) 214 215 def test_relativelocalfile(self): 216 self.assertRaises(ValueError,urllib.request.urlopen,'./' + self.pathname) 217 218 219class ProxyTests(unittest.TestCase): 220 221 def setUp(self): 222 # Records changes to env vars 223 self.env = support.EnvironmentVarGuard() 224 # Delete all proxy related env vars 225 for k in list(os.environ): 226 if 'proxy' in k.lower(): 227 self.env.unset(k) 228 229 def tearDown(self): 230 # Restore all proxy related env vars 231 self.env.__exit__() 232 del self.env 233 234 def test_getproxies_environment_keep_no_proxies(self): 235 self.env.set('NO_PROXY', 'localhost') 236 proxies = urllib.request.getproxies_environment() 237 # getproxies_environment use lowered case truncated (no '_proxy') keys 238 self.assertEqual('localhost', proxies['no']) 239 # List of no_proxies with space. 240 self.env.set('NO_PROXY', 'localhost, anotherdomain.com, newdomain.com:1234') 241 self.assertTrue(urllib.request.proxy_bypass_environment('anotherdomain.com')) 242 self.assertTrue(urllib.request.proxy_bypass_environment('anotherdomain.com:8888')) 243 self.assertTrue(urllib.request.proxy_bypass_environment('newdomain.com:1234')) 244 245 def test_proxy_cgi_ignore(self): 246 try: 247 self.env.set('HTTP_PROXY', 'http://somewhere:3128') 248 proxies = urllib.request.getproxies_environment() 249 self.assertEqual('http://somewhere:3128', proxies['http']) 250 self.env.set('REQUEST_METHOD', 'GET') 251 proxies = urllib.request.getproxies_environment() 252 self.assertNotIn('http', proxies) 253 finally: 254 self.env.unset('REQUEST_METHOD') 255 self.env.unset('HTTP_PROXY') 256 257 def test_proxy_bypass_environment_host_match(self): 258 bypass = urllib.request.proxy_bypass_environment 259 self.env.set('NO_PROXY', 260 'localhost, anotherdomain.com, newdomain.com:1234, .d.o.t') 261 self.assertTrue(bypass('localhost')) 262 self.assertTrue(bypass('LocalHost')) # MixedCase 263 self.assertTrue(bypass('LOCALHOST')) # UPPERCASE 264 self.assertTrue(bypass('.localhost')) 265 self.assertTrue(bypass('newdomain.com:1234')) 266 self.assertTrue(bypass('.newdomain.com:1234')) 267 self.assertTrue(bypass('foo.d.o.t')) # issue 29142 268 self.assertTrue(bypass('d.o.t')) 269 self.assertTrue(bypass('anotherdomain.com:8888')) 270 self.assertTrue(bypass('.anotherdomain.com:8888')) 271 self.assertTrue(bypass('www.newdomain.com:1234')) 272 self.assertFalse(bypass('prelocalhost')) 273 self.assertFalse(bypass('newdomain.com')) # no port 274 self.assertFalse(bypass('newdomain.com:1235')) # wrong port 275 276 def test_proxy_bypass_environment_always_match(self): 277 bypass = urllib.request.proxy_bypass_environment 278 self.env.set('NO_PROXY', '*') 279 self.assertTrue(bypass('newdomain.com')) 280 self.assertTrue(bypass('newdomain.com:1234')) 281 self.env.set('NO_PROXY', '*, anotherdomain.com') 282 self.assertTrue(bypass('anotherdomain.com')) 283 self.assertFalse(bypass('newdomain.com')) 284 self.assertFalse(bypass('newdomain.com:1234')) 285 286 def test_proxy_bypass_environment_newline(self): 287 bypass = urllib.request.proxy_bypass_environment 288 self.env.set('NO_PROXY', 289 'localhost, anotherdomain.com, newdomain.com:1234') 290 self.assertFalse(bypass('localhost\n')) 291 self.assertFalse(bypass('anotherdomain.com:8888\n')) 292 self.assertFalse(bypass('newdomain.com:1234\n')) 293 294 295class ProxyTests_withOrderedEnv(unittest.TestCase): 296 297 def setUp(self): 298 # We need to test conditions, where variable order _is_ significant 299 self._saved_env = os.environ 300 # Monkey patch os.environ, start with empty fake environment 301 os.environ = collections.OrderedDict() 302 303 def tearDown(self): 304 os.environ = self._saved_env 305 306 def test_getproxies_environment_prefer_lowercase(self): 307 # Test lowercase preference with removal 308 os.environ['no_proxy'] = '' 309 os.environ['No_Proxy'] = 'localhost' 310 self.assertFalse(urllib.request.proxy_bypass_environment('localhost')) 311 self.assertFalse(urllib.request.proxy_bypass_environment('arbitrary')) 312 os.environ['http_proxy'] = '' 313 os.environ['HTTP_PROXY'] = 'http://somewhere:3128' 314 proxies = urllib.request.getproxies_environment() 315 self.assertEqual({}, proxies) 316 # Test lowercase preference of proxy bypass and correct matching including ports 317 os.environ['no_proxy'] = 'localhost, noproxy.com, my.proxy:1234' 318 os.environ['No_Proxy'] = 'xyz.com' 319 self.assertTrue(urllib.request.proxy_bypass_environment('localhost')) 320 self.assertTrue(urllib.request.proxy_bypass_environment('noproxy.com:5678')) 321 self.assertTrue(urllib.request.proxy_bypass_environment('my.proxy:1234')) 322 self.assertFalse(urllib.request.proxy_bypass_environment('my.proxy')) 323 self.assertFalse(urllib.request.proxy_bypass_environment('arbitrary')) 324 # Test lowercase preference with replacement 325 os.environ['http_proxy'] = 'http://somewhere:3128' 326 os.environ['Http_Proxy'] = 'http://somewhereelse:3128' 327 proxies = urllib.request.getproxies_environment() 328 self.assertEqual('http://somewhere:3128', proxies['http']) 329 330 331class urlopen_HttpTests(unittest.TestCase, FakeHTTPMixin, FakeFTPMixin): 332 """Test urlopen() opening a fake http connection.""" 333 334 def check_read(self, ver): 335 self.fakehttp(b"HTTP/" + ver + b" 200 OK\r\n\r\nHello!") 336 try: 337 fp = urlopen("http://python.org/") 338 self.assertEqual(fp.readline(), b"Hello!") 339 self.assertEqual(fp.readline(), b"") 340 self.assertEqual(fp.geturl(), 'http://python.org/') 341 self.assertEqual(fp.getcode(), 200) 342 finally: 343 self.unfakehttp() 344 345 def test_url_fragment(self): 346 # Issue #11703: geturl() omits fragments in the original URL. 347 url = 'http://docs.python.org/library/urllib.html#OK' 348 self.fakehttp(b"HTTP/1.1 200 OK\r\n\r\nHello!") 349 try: 350 fp = urllib.request.urlopen(url) 351 self.assertEqual(fp.geturl(), url) 352 finally: 353 self.unfakehttp() 354 355 def test_willclose(self): 356 self.fakehttp(b"HTTP/1.1 200 OK\r\n\r\nHello!") 357 try: 358 resp = urlopen("http://www.python.org") 359 self.assertTrue(resp.fp.will_close) 360 finally: 361 self.unfakehttp() 362 363 @unittest.skipUnless(ssl, "ssl module required") 364 def test_url_path_with_control_char_rejected(self): 365 for char_no in list(range(0, 0x21)) + [0x7f]: 366 char = chr(char_no) 367 schemeless_url = f"//localhost:7777/test{char}/" 368 self.fakehttp(b"HTTP/1.1 200 OK\r\n\r\nHello.") 369 try: 370 # We explicitly test urllib.request.urlopen() instead of the top 371 # level 'def urlopen()' function defined in this... (quite ugly) 372 # test suite. They use different url opening codepaths. Plain 373 # urlopen uses FancyURLOpener which goes via a codepath that 374 # calls urllib.parse.quote() on the URL which makes all of the 375 # above attempts at injection within the url _path_ safe. 376 escaped_char_repr = repr(char).replace('\\', r'\\') 377 InvalidURL = http.client.InvalidURL 378 with self.assertRaisesRegex( 379 InvalidURL, f"contain control.*{escaped_char_repr}"): 380 urllib.request.urlopen(f"http:{schemeless_url}") 381 with self.assertRaisesRegex( 382 InvalidURL, f"contain control.*{escaped_char_repr}"): 383 urllib.request.urlopen(f"https:{schemeless_url}") 384 # This code path quotes the URL so there is no injection. 385 resp = urlopen(f"http:{schemeless_url}") 386 self.assertNotIn(char, resp.geturl()) 387 finally: 388 self.unfakehttp() 389 390 @unittest.skipUnless(ssl, "ssl module required") 391 def test_url_path_with_newline_header_injection_rejected(self): 392 self.fakehttp(b"HTTP/1.1 200 OK\r\n\r\nHello.") 393 host = "localhost:7777?a=1 HTTP/1.1\r\nX-injected: header\r\nTEST: 123" 394 schemeless_url = "//" + host + ":8080/test/?test=a" 395 try: 396 # We explicitly test urllib.request.urlopen() instead of the top 397 # level 'def urlopen()' function defined in this... (quite ugly) 398 # test suite. They use different url opening codepaths. Plain 399 # urlopen uses FancyURLOpener which goes via a codepath that 400 # calls urllib.parse.quote() on the URL which makes all of the 401 # above attempts at injection within the url _path_ safe. 402 InvalidURL = http.client.InvalidURL 403 with self.assertRaisesRegex( 404 InvalidURL, r"contain control.*\\r.*(found at least . .)"): 405 urllib.request.urlopen(f"http:{schemeless_url}") 406 with self.assertRaisesRegex(InvalidURL, r"contain control.*\\n"): 407 urllib.request.urlopen(f"https:{schemeless_url}") 408 # This code path quotes the URL so there is no injection. 409 resp = urlopen(f"http:{schemeless_url}") 410 self.assertNotIn(' ', resp.geturl()) 411 self.assertNotIn('\r', resp.geturl()) 412 self.assertNotIn('\n', resp.geturl()) 413 finally: 414 self.unfakehttp() 415 416 @unittest.skipUnless(ssl, "ssl module required") 417 def test_url_host_with_control_char_rejected(self): 418 for char_no in list(range(0, 0x21)) + [0x7f]: 419 char = chr(char_no) 420 schemeless_url = f"//localhost{char}/test/" 421 self.fakehttp(b"HTTP/1.1 200 OK\r\n\r\nHello.") 422 try: 423 escaped_char_repr = repr(char).replace('\\', r'\\') 424 InvalidURL = http.client.InvalidURL 425 with self.assertRaisesRegex( 426 InvalidURL, f"contain control.*{escaped_char_repr}"): 427 urlopen(f"http:{schemeless_url}") 428 with self.assertRaisesRegex(InvalidURL, f"contain control.*{escaped_char_repr}"): 429 urlopen(f"https:{schemeless_url}") 430 finally: 431 self.unfakehttp() 432 433 @unittest.skipUnless(ssl, "ssl module required") 434 def test_url_host_with_newline_header_injection_rejected(self): 435 self.fakehttp(b"HTTP/1.1 200 OK\r\n\r\nHello.") 436 host = "localhost\r\nX-injected: header\r\n" 437 schemeless_url = "//" + host + ":8080/test/?test=a" 438 try: 439 InvalidURL = http.client.InvalidURL 440 with self.assertRaisesRegex( 441 InvalidURL, r"contain control.*\\r"): 442 urlopen(f"http:{schemeless_url}") 443 with self.assertRaisesRegex(InvalidURL, r"contain control.*\\n"): 444 urlopen(f"https:{schemeless_url}") 445 finally: 446 self.unfakehttp() 447 448 def test_read_0_9(self): 449 # "0.9" response accepted (but not "simple responses" without 450 # a status line) 451 self.check_read(b"0.9") 452 453 def test_read_1_0(self): 454 self.check_read(b"1.0") 455 456 def test_read_1_1(self): 457 self.check_read(b"1.1") 458 459 def test_read_bogus(self): 460 # urlopen() should raise OSError for many error codes. 461 self.fakehttp(b'''HTTP/1.1 401 Authentication Required 462Date: Wed, 02 Jan 2008 03:03:54 GMT 463Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e 464Connection: close 465Content-Type: text/html; charset=iso-8859-1 466''', mock_close=True) 467 try: 468 self.assertRaises(OSError, urlopen, "http://python.org/") 469 finally: 470 self.unfakehttp() 471 472 def test_invalid_redirect(self): 473 # urlopen() should raise OSError for many error codes. 474 self.fakehttp(b'''HTTP/1.1 302 Found 475Date: Wed, 02 Jan 2008 03:03:54 GMT 476Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e 477Location: file://guidocomputer.athome.com:/python/license 478Connection: close 479Content-Type: text/html; charset=iso-8859-1 480''', mock_close=True) 481 try: 482 msg = "Redirection to url 'file:" 483 with self.assertRaisesRegex(urllib.error.HTTPError, msg): 484 urlopen("http://python.org/") 485 finally: 486 self.unfakehttp() 487 488 def test_redirect_limit_independent(self): 489 # Ticket #12923: make sure independent requests each use their 490 # own retry limit. 491 for i in range(FancyURLopener().maxtries): 492 self.fakehttp(b'''HTTP/1.1 302 Found 493Location: file://guidocomputer.athome.com:/python/license 494Connection: close 495''', mock_close=True) 496 try: 497 self.assertRaises(urllib.error.HTTPError, urlopen, 498 "http://something") 499 finally: 500 self.unfakehttp() 501 502 def test_empty_socket(self): 503 # urlopen() raises OSError if the underlying socket does not send any 504 # data. (#1680230) 505 self.fakehttp(b'') 506 try: 507 self.assertRaises(OSError, urlopen, "http://something") 508 finally: 509 self.unfakehttp() 510 511 def test_missing_localfile(self): 512 # Test for #10836 513 with self.assertRaises(urllib.error.URLError) as e: 514 urlopen('file://localhost/a/file/which/doesnot/exists.py') 515 self.assertTrue(e.exception.filename) 516 self.assertTrue(e.exception.reason) 517 518 def test_file_notexists(self): 519 fd, tmp_file = tempfile.mkstemp() 520 tmp_fileurl = 'file://localhost/' + tmp_file.replace(os.path.sep, '/') 521 try: 522 self.assertTrue(os.path.exists(tmp_file)) 523 with urlopen(tmp_fileurl) as fobj: 524 self.assertTrue(fobj) 525 finally: 526 os.close(fd) 527 os.unlink(tmp_file) 528 self.assertFalse(os.path.exists(tmp_file)) 529 with self.assertRaises(urllib.error.URLError): 530 urlopen(tmp_fileurl) 531 532 def test_ftp_nohost(self): 533 test_ftp_url = 'ftp:///path' 534 with self.assertRaises(urllib.error.URLError) as e: 535 urlopen(test_ftp_url) 536 self.assertFalse(e.exception.filename) 537 self.assertTrue(e.exception.reason) 538 539 def test_ftp_nonexisting(self): 540 with self.assertRaises(urllib.error.URLError) as e: 541 urlopen('ftp://localhost/a/file/which/doesnot/exists.py') 542 self.assertFalse(e.exception.filename) 543 self.assertTrue(e.exception.reason) 544 545 @patch.object(urllib.request, 'MAXFTPCACHE', 0) 546 def test_ftp_cache_pruning(self): 547 self.fakeftp() 548 try: 549 urllib.request.ftpcache['test'] = urllib.request.ftpwrapper('user', 'pass', 'localhost', 21, []) 550 urlopen('ftp://localhost') 551 finally: 552 self.unfakeftp() 553 554 def test_userpass_inurl(self): 555 self.fakehttp(b"HTTP/1.0 200 OK\r\n\r\nHello!") 556 try: 557 fp = urlopen("http://user:pass@python.org/") 558 self.assertEqual(fp.readline(), b"Hello!") 559 self.assertEqual(fp.readline(), b"") 560 self.assertEqual(fp.geturl(), 'http://user:pass@python.org/') 561 self.assertEqual(fp.getcode(), 200) 562 finally: 563 self.unfakehttp() 564 565 def test_userpass_inurl_w_spaces(self): 566 self.fakehttp(b"HTTP/1.0 200 OK\r\n\r\nHello!") 567 try: 568 userpass = "a b:c d" 569 url = "http://{}@python.org/".format(userpass) 570 fakehttp_wrapper = http.client.HTTPConnection 571 authorization = ("Authorization: Basic %s\r\n" % 572 b64encode(userpass.encode("ASCII")).decode("ASCII")) 573 fp = urlopen(url) 574 # The authorization header must be in place 575 self.assertIn(authorization, fakehttp_wrapper.buf.decode("UTF-8")) 576 self.assertEqual(fp.readline(), b"Hello!") 577 self.assertEqual(fp.readline(), b"") 578 # the spaces are quoted in URL so no match 579 self.assertNotEqual(fp.geturl(), url) 580 self.assertEqual(fp.getcode(), 200) 581 finally: 582 self.unfakehttp() 583 584 def test_URLopener_deprecation(self): 585 with support.check_warnings(('',DeprecationWarning)): 586 urllib.request.URLopener() 587 588 @unittest.skipUnless(ssl, "ssl module required") 589 def test_cafile_and_context(self): 590 context = ssl.create_default_context() 591 with support.check_warnings(('', DeprecationWarning)): 592 with self.assertRaises(ValueError): 593 urllib.request.urlopen( 594 "https://localhost", cafile="/nonexistent/path", context=context 595 ) 596 597 598class urlopen_DataTests(unittest.TestCase): 599 """Test urlopen() opening a data URL.""" 600 601 def setUp(self): 602 # text containing URL special- and unicode-characters 603 self.text = "test data URLs :;,%=& \u00f6 \u00c4 " 604 # 2x1 pixel RGB PNG image with one black and one white pixel 605 self.image = ( 606 b'\x89PNG\r\n\x1a\n\x00\x00\x00\rIHDR\x00\x00\x00\x02\x00\x00\x00' 607 b'\x01\x08\x02\x00\x00\x00{@\xe8\xdd\x00\x00\x00\x01sRGB\x00\xae' 608 b'\xce\x1c\xe9\x00\x00\x00\x0fIDAT\x08\xd7c```\xf8\xff\xff?\x00' 609 b'\x06\x01\x02\xfe\no/\x1e\x00\x00\x00\x00IEND\xaeB`\x82') 610 611 self.text_url = ( 612 "data:text/plain;charset=UTF-8,test%20data%20URLs%20%3A%3B%2C%25%3" 613 "D%26%20%C3%B6%20%C3%84%20") 614 self.text_url_base64 = ( 615 "data:text/plain;charset=ISO-8859-1;base64,dGVzdCBkYXRhIFVSTHMgOjs" 616 "sJT0mIPYgxCA%3D") 617 # base64 encoded data URL that contains ignorable spaces, 618 # such as "\n", " ", "%0A", and "%20". 619 self.image_url = ( 620 "\n" 621 "QOjdAAAAAXNSR0IArs4c6QAAAA9JREFUCNdj%0AYGBg%2BP//PwAGAQL%2BCm8 " 622 "vHgAAAABJRU5ErkJggg%3D%3D%0A%20") 623 624 self.text_url_resp = urllib.request.urlopen(self.text_url) 625 self.text_url_base64_resp = urllib.request.urlopen( 626 self.text_url_base64) 627 self.image_url_resp = urllib.request.urlopen(self.image_url) 628 629 def test_interface(self): 630 # Make sure object returned by urlopen() has the specified methods 631 for attr in ("read", "readline", "readlines", 632 "close", "info", "geturl", "getcode", "__iter__"): 633 self.assertTrue(hasattr(self.text_url_resp, attr), 634 "object returned by urlopen() lacks %s attribute" % 635 attr) 636 637 def test_info(self): 638 self.assertIsInstance(self.text_url_resp.info(), email.message.Message) 639 self.assertEqual(self.text_url_base64_resp.info().get_params(), 640 [('text/plain', ''), ('charset', 'ISO-8859-1')]) 641 self.assertEqual(self.image_url_resp.info()['content-length'], 642 str(len(self.image))) 643 self.assertEqual(urllib.request.urlopen("data:,").info().get_params(), 644 [('text/plain', ''), ('charset', 'US-ASCII')]) 645 646 def test_geturl(self): 647 self.assertEqual(self.text_url_resp.geturl(), self.text_url) 648 self.assertEqual(self.text_url_base64_resp.geturl(), 649 self.text_url_base64) 650 self.assertEqual(self.image_url_resp.geturl(), self.image_url) 651 652 def test_read_text(self): 653 self.assertEqual(self.text_url_resp.read().decode( 654 dict(self.text_url_resp.info().get_params())['charset']), self.text) 655 656 def test_read_text_base64(self): 657 self.assertEqual(self.text_url_base64_resp.read().decode( 658 dict(self.text_url_base64_resp.info().get_params())['charset']), 659 self.text) 660 661 def test_read_image(self): 662 self.assertEqual(self.image_url_resp.read(), self.image) 663 664 def test_missing_comma(self): 665 self.assertRaises(ValueError,urllib.request.urlopen,'data:text/plain') 666 667 def test_invalid_base64_data(self): 668 # missing padding character 669 self.assertRaises(ValueError,urllib.request.urlopen,'data:;base64,Cg=') 670 671 672class urlretrieve_FileTests(unittest.TestCase): 673 """Test urllib.urlretrieve() on local files""" 674 675 def setUp(self): 676 # Create a list of temporary files. Each item in the list is a file 677 # name (absolute path or relative to the current working directory). 678 # All files in this list will be deleted in the tearDown method. Note, 679 # this only helps to makes sure temporary files get deleted, but it 680 # does nothing about trying to close files that may still be open. It 681 # is the responsibility of the developer to properly close files even 682 # when exceptional conditions occur. 683 self.tempFiles = [] 684 685 # Create a temporary file. 686 self.registerFileForCleanUp(support.TESTFN) 687 self.text = b'testing urllib.urlretrieve' 688 try: 689 FILE = open(support.TESTFN, 'wb') 690 FILE.write(self.text) 691 FILE.close() 692 finally: 693 try: FILE.close() 694 except: pass 695 696 def tearDown(self): 697 # Delete the temporary files. 698 for each in self.tempFiles: 699 try: os.remove(each) 700 except: pass 701 702 def constructLocalFileUrl(self, filePath): 703 filePath = os.path.abspath(filePath) 704 try: 705 filePath.encode("utf-8") 706 except UnicodeEncodeError: 707 raise unittest.SkipTest("filePath is not encodable to utf8") 708 return "file://%s" % urllib.request.pathname2url(filePath) 709 710 def createNewTempFile(self, data=b""): 711 """Creates a new temporary file containing the specified data, 712 registers the file for deletion during the test fixture tear down, and 713 returns the absolute path of the file.""" 714 715 newFd, newFilePath = tempfile.mkstemp() 716 try: 717 self.registerFileForCleanUp(newFilePath) 718 newFile = os.fdopen(newFd, "wb") 719 newFile.write(data) 720 newFile.close() 721 finally: 722 try: newFile.close() 723 except: pass 724 return newFilePath 725 726 def registerFileForCleanUp(self, fileName): 727 self.tempFiles.append(fileName) 728 729 def test_basic(self): 730 # Make sure that a local file just gets its own location returned and 731 # a headers value is returned. 732 result = urllib.request.urlretrieve("file:%s" % support.TESTFN) 733 self.assertEqual(result[0], support.TESTFN) 734 self.assertIsInstance(result[1], email.message.Message, 735 "did not get an email.message.Message instance " 736 "as second returned value") 737 738 def test_copy(self): 739 # Test that setting the filename argument works. 740 second_temp = "%s.2" % support.TESTFN 741 self.registerFileForCleanUp(second_temp) 742 result = urllib.request.urlretrieve(self.constructLocalFileUrl( 743 support.TESTFN), second_temp) 744 self.assertEqual(second_temp, result[0]) 745 self.assertTrue(os.path.exists(second_temp), "copy of the file was not " 746 "made") 747 FILE = open(second_temp, 'rb') 748 try: 749 text = FILE.read() 750 FILE.close() 751 finally: 752 try: FILE.close() 753 except: pass 754 self.assertEqual(self.text, text) 755 756 def test_reporthook(self): 757 # Make sure that the reporthook works. 758 def hooktester(block_count, block_read_size, file_size, count_holder=[0]): 759 self.assertIsInstance(block_count, int) 760 self.assertIsInstance(block_read_size, int) 761 self.assertIsInstance(file_size, int) 762 self.assertEqual(block_count, count_holder[0]) 763 count_holder[0] = count_holder[0] + 1 764 second_temp = "%s.2" % support.TESTFN 765 self.registerFileForCleanUp(second_temp) 766 urllib.request.urlretrieve( 767 self.constructLocalFileUrl(support.TESTFN), 768 second_temp, hooktester) 769 770 def test_reporthook_0_bytes(self): 771 # Test on zero length file. Should call reporthook only 1 time. 772 report = [] 773 def hooktester(block_count, block_read_size, file_size, _report=report): 774 _report.append((block_count, block_read_size, file_size)) 775 srcFileName = self.createNewTempFile() 776 urllib.request.urlretrieve(self.constructLocalFileUrl(srcFileName), 777 support.TESTFN, hooktester) 778 self.assertEqual(len(report), 1) 779 self.assertEqual(report[0][2], 0) 780 781 def test_reporthook_5_bytes(self): 782 # Test on 5 byte file. Should call reporthook only 2 times (once when 783 # the "network connection" is established and once when the block is 784 # read). 785 report = [] 786 def hooktester(block_count, block_read_size, file_size, _report=report): 787 _report.append((block_count, block_read_size, file_size)) 788 srcFileName = self.createNewTempFile(b"x" * 5) 789 urllib.request.urlretrieve(self.constructLocalFileUrl(srcFileName), 790 support.TESTFN, hooktester) 791 self.assertEqual(len(report), 2) 792 self.assertEqual(report[0][2], 5) 793 self.assertEqual(report[1][2], 5) 794 795 def test_reporthook_8193_bytes(self): 796 # Test on 8193 byte file. Should call reporthook only 3 times (once 797 # when the "network connection" is established, once for the next 8192 798 # bytes, and once for the last byte). 799 report = [] 800 def hooktester(block_count, block_read_size, file_size, _report=report): 801 _report.append((block_count, block_read_size, file_size)) 802 srcFileName = self.createNewTempFile(b"x" * 8193) 803 urllib.request.urlretrieve(self.constructLocalFileUrl(srcFileName), 804 support.TESTFN, hooktester) 805 self.assertEqual(len(report), 3) 806 self.assertEqual(report[0][2], 8193) 807 self.assertEqual(report[0][1], 8192) 808 self.assertEqual(report[1][1], 8192) 809 self.assertEqual(report[2][1], 8192) 810 811 812class urlretrieve_HttpTests(unittest.TestCase, FakeHTTPMixin): 813 """Test urllib.urlretrieve() using fake http connections""" 814 815 def test_short_content_raises_ContentTooShortError(self): 816 self.fakehttp(b'''HTTP/1.1 200 OK 817Date: Wed, 02 Jan 2008 03:03:54 GMT 818Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e 819Connection: close 820Content-Length: 100 821Content-Type: text/html; charset=iso-8859-1 822 823FF 824''') 825 826 def _reporthook(par1, par2, par3): 827 pass 828 829 with self.assertRaises(urllib.error.ContentTooShortError): 830 try: 831 urllib.request.urlretrieve(support.TEST_HTTP_URL, 832 reporthook=_reporthook) 833 finally: 834 self.unfakehttp() 835 836 def test_short_content_raises_ContentTooShortError_without_reporthook(self): 837 self.fakehttp(b'''HTTP/1.1 200 OK 838Date: Wed, 02 Jan 2008 03:03:54 GMT 839Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e 840Connection: close 841Content-Length: 100 842Content-Type: text/html; charset=iso-8859-1 843 844FF 845''') 846 with self.assertRaises(urllib.error.ContentTooShortError): 847 try: 848 urllib.request.urlretrieve(support.TEST_HTTP_URL) 849 finally: 850 self.unfakehttp() 851 852 853class QuotingTests(unittest.TestCase): 854 r"""Tests for urllib.quote() and urllib.quote_plus() 855 856 According to RFC 3986 (Uniform Resource Identifiers), to escape a 857 character you write it as '%' + <2 character US-ASCII hex value>. 858 The Python code of ``'%' + hex(ord(<character>))[2:]`` escapes a 859 character properly. Case does not matter on the hex letters. 860 861 The various character sets specified are: 862 863 Reserved characters : ";/?:@&=+$," 864 Have special meaning in URIs and must be escaped if not being used for 865 their special meaning 866 Data characters : letters, digits, and "-_.!~*'()" 867 Unreserved and do not need to be escaped; can be, though, if desired 868 Control characters : 0x00 - 0x1F, 0x7F 869 Have no use in URIs so must be escaped 870 space : 0x20 871 Must be escaped 872 Delimiters : '<>#%"' 873 Must be escaped 874 Unwise : "{}|\^[]`" 875 Must be escaped 876 877 """ 878 879 def test_never_quote(self): 880 # Make sure quote() does not quote letters, digits, and "_,.-" 881 do_not_quote = '' .join(["ABCDEFGHIJKLMNOPQRSTUVWXYZ", 882 "abcdefghijklmnopqrstuvwxyz", 883 "0123456789", 884 "_.-~"]) 885 result = urllib.parse.quote(do_not_quote) 886 self.assertEqual(do_not_quote, result, 887 "using quote(): %r != %r" % (do_not_quote, result)) 888 result = urllib.parse.quote_plus(do_not_quote) 889 self.assertEqual(do_not_quote, result, 890 "using quote_plus(): %r != %r" % (do_not_quote, result)) 891 892 def test_default_safe(self): 893 # Test '/' is default value for 'safe' parameter 894 self.assertEqual(urllib.parse.quote.__defaults__[0], '/') 895 896 def test_safe(self): 897 # Test setting 'safe' parameter does what it should do 898 quote_by_default = "<>" 899 result = urllib.parse.quote(quote_by_default, safe=quote_by_default) 900 self.assertEqual(quote_by_default, result, 901 "using quote(): %r != %r" % (quote_by_default, result)) 902 result = urllib.parse.quote_plus(quote_by_default, 903 safe=quote_by_default) 904 self.assertEqual(quote_by_default, result, 905 "using quote_plus(): %r != %r" % 906 (quote_by_default, result)) 907 # Safe expressed as bytes rather than str 908 result = urllib.parse.quote(quote_by_default, safe=b"<>") 909 self.assertEqual(quote_by_default, result, 910 "using quote(): %r != %r" % (quote_by_default, result)) 911 # "Safe" non-ASCII characters should have no effect 912 # (Since URIs are not allowed to have non-ASCII characters) 913 result = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="\xfc") 914 expect = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="") 915 self.assertEqual(expect, result, 916 "using quote(): %r != %r" % 917 (expect, result)) 918 # Same as above, but using a bytes rather than str 919 result = urllib.parse.quote("a\xfcb", encoding="latin-1", safe=b"\xfc") 920 expect = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="") 921 self.assertEqual(expect, result, 922 "using quote(): %r != %r" % 923 (expect, result)) 924 925 def test_default_quoting(self): 926 # Make sure all characters that should be quoted are by default sans 927 # space (separate test for that). 928 should_quote = [chr(num) for num in range(32)] # For 0x00 - 0x1F 929 should_quote.append(r'<>#%"{}|\^[]`') 930 should_quote.append(chr(127)) # For 0x7F 931 should_quote = ''.join(should_quote) 932 for char in should_quote: 933 result = urllib.parse.quote(char) 934 self.assertEqual(hexescape(char), result, 935 "using quote(): " 936 "%s should be escaped to %s, not %s" % 937 (char, hexescape(char), result)) 938 result = urllib.parse.quote_plus(char) 939 self.assertEqual(hexescape(char), result, 940 "using quote_plus(): " 941 "%s should be escapes to %s, not %s" % 942 (char, hexescape(char), result)) 943 del should_quote 944 partial_quote = "ab[]cd" 945 expected = "ab%5B%5Dcd" 946 result = urllib.parse.quote(partial_quote) 947 self.assertEqual(expected, result, 948 "using quote(): %r != %r" % (expected, result)) 949 result = urllib.parse.quote_plus(partial_quote) 950 self.assertEqual(expected, result, 951 "using quote_plus(): %r != %r" % (expected, result)) 952 953 def test_quoting_space(self): 954 # Make sure quote() and quote_plus() handle spaces as specified in 955 # their unique way 956 result = urllib.parse.quote(' ') 957 self.assertEqual(result, hexescape(' '), 958 "using quote(): %r != %r" % (result, hexescape(' '))) 959 result = urllib.parse.quote_plus(' ') 960 self.assertEqual(result, '+', 961 "using quote_plus(): %r != +" % result) 962 given = "a b cd e f" 963 expect = given.replace(' ', hexescape(' ')) 964 result = urllib.parse.quote(given) 965 self.assertEqual(expect, result, 966 "using quote(): %r != %r" % (expect, result)) 967 expect = given.replace(' ', '+') 968 result = urllib.parse.quote_plus(given) 969 self.assertEqual(expect, result, 970 "using quote_plus(): %r != %r" % (expect, result)) 971 972 def test_quoting_plus(self): 973 self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma'), 974 'alpha%2Bbeta+gamma') 975 self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma', '+'), 976 'alpha+beta+gamma') 977 # Test with bytes 978 self.assertEqual(urllib.parse.quote_plus(b'alpha+beta gamma'), 979 'alpha%2Bbeta+gamma') 980 # Test with safe bytes 981 self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma', b'+'), 982 'alpha+beta+gamma') 983 984 def test_quote_bytes(self): 985 # Bytes should quote directly to percent-encoded values 986 given = b"\xa2\xd8ab\xff" 987 expect = "%A2%D8ab%FF" 988 result = urllib.parse.quote(given) 989 self.assertEqual(expect, result, 990 "using quote(): %r != %r" % (expect, result)) 991 # Encoding argument should raise type error on bytes input 992 self.assertRaises(TypeError, urllib.parse.quote, given, 993 encoding="latin-1") 994 # quote_from_bytes should work the same 995 result = urllib.parse.quote_from_bytes(given) 996 self.assertEqual(expect, result, 997 "using quote_from_bytes(): %r != %r" 998 % (expect, result)) 999 1000 def test_quote_with_unicode(self): 1001 # Characters in Latin-1 range, encoded by default in UTF-8 1002 given = "\xa2\xd8ab\xff" 1003 expect = "%C2%A2%C3%98ab%C3%BF" 1004 result = urllib.parse.quote(given) 1005 self.assertEqual(expect, result, 1006 "using quote(): %r != %r" % (expect, result)) 1007 # Characters in Latin-1 range, encoded by with None (default) 1008 result = urllib.parse.quote(given, encoding=None, errors=None) 1009 self.assertEqual(expect, result, 1010 "using quote(): %r != %r" % (expect, result)) 1011 # Characters in Latin-1 range, encoded with Latin-1 1012 given = "\xa2\xd8ab\xff" 1013 expect = "%A2%D8ab%FF" 1014 result = urllib.parse.quote(given, encoding="latin-1") 1015 self.assertEqual(expect, result, 1016 "using quote(): %r != %r" % (expect, result)) 1017 # Characters in BMP, encoded by default in UTF-8 1018 given = "\u6f22\u5b57" # "Kanji" 1019 expect = "%E6%BC%A2%E5%AD%97" 1020 result = urllib.parse.quote(given) 1021 self.assertEqual(expect, result, 1022 "using quote(): %r != %r" % (expect, result)) 1023 # Characters in BMP, encoded with Latin-1 1024 given = "\u6f22\u5b57" 1025 self.assertRaises(UnicodeEncodeError, urllib.parse.quote, given, 1026 encoding="latin-1") 1027 # Characters in BMP, encoded with Latin-1, with replace error handling 1028 given = "\u6f22\u5b57" 1029 expect = "%3F%3F" # "??" 1030 result = urllib.parse.quote(given, encoding="latin-1", 1031 errors="replace") 1032 self.assertEqual(expect, result, 1033 "using quote(): %r != %r" % (expect, result)) 1034 # Characters in BMP, Latin-1, with xmlcharref error handling 1035 given = "\u6f22\u5b57" 1036 expect = "%26%2328450%3B%26%2323383%3B" # "漢字" 1037 result = urllib.parse.quote(given, encoding="latin-1", 1038 errors="xmlcharrefreplace") 1039 self.assertEqual(expect, result, 1040 "using quote(): %r != %r" % (expect, result)) 1041 1042 def test_quote_plus_with_unicode(self): 1043 # Encoding (latin-1) test for quote_plus 1044 given = "\xa2\xd8 \xff" 1045 expect = "%A2%D8+%FF" 1046 result = urllib.parse.quote_plus(given, encoding="latin-1") 1047 self.assertEqual(expect, result, 1048 "using quote_plus(): %r != %r" % (expect, result)) 1049 # Errors test for quote_plus 1050 given = "ab\u6f22\u5b57 cd" 1051 expect = "ab%3F%3F+cd" 1052 result = urllib.parse.quote_plus(given, encoding="latin-1", 1053 errors="replace") 1054 self.assertEqual(expect, result, 1055 "using quote_plus(): %r != %r" % (expect, result)) 1056 1057 1058class UnquotingTests(unittest.TestCase): 1059 """Tests for unquote() and unquote_plus() 1060 1061 See the doc string for quoting_Tests for details on quoting and such. 1062 1063 """ 1064 1065 def test_unquoting(self): 1066 # Make sure unquoting of all ASCII values works 1067 escape_list = [] 1068 for num in range(128): 1069 given = hexescape(chr(num)) 1070 expect = chr(num) 1071 result = urllib.parse.unquote(given) 1072 self.assertEqual(expect, result, 1073 "using unquote(): %r != %r" % (expect, result)) 1074 result = urllib.parse.unquote_plus(given) 1075 self.assertEqual(expect, result, 1076 "using unquote_plus(): %r != %r" % 1077 (expect, result)) 1078 escape_list.append(given) 1079 escape_string = ''.join(escape_list) 1080 del escape_list 1081 result = urllib.parse.unquote(escape_string) 1082 self.assertEqual(result.count('%'), 1, 1083 "using unquote(): not all characters escaped: " 1084 "%s" % result) 1085 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote, None) 1086 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote, ()) 1087 with support.check_warnings(('', BytesWarning), quiet=True): 1088 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote, b'') 1089 1090 def test_unquoting_badpercent(self): 1091 # Test unquoting on bad percent-escapes 1092 given = '%xab' 1093 expect = given 1094 result = urllib.parse.unquote(given) 1095 self.assertEqual(expect, result, "using unquote(): %r != %r" 1096 % (expect, result)) 1097 given = '%x' 1098 expect = given 1099 result = urllib.parse.unquote(given) 1100 self.assertEqual(expect, result, "using unquote(): %r != %r" 1101 % (expect, result)) 1102 given = '%' 1103 expect = given 1104 result = urllib.parse.unquote(given) 1105 self.assertEqual(expect, result, "using unquote(): %r != %r" 1106 % (expect, result)) 1107 # unquote_to_bytes 1108 given = '%xab' 1109 expect = bytes(given, 'ascii') 1110 result = urllib.parse.unquote_to_bytes(given) 1111 self.assertEqual(expect, result, "using unquote_to_bytes(): %r != %r" 1112 % (expect, result)) 1113 given = '%x' 1114 expect = bytes(given, 'ascii') 1115 result = urllib.parse.unquote_to_bytes(given) 1116 self.assertEqual(expect, result, "using unquote_to_bytes(): %r != %r" 1117 % (expect, result)) 1118 given = '%' 1119 expect = bytes(given, 'ascii') 1120 result = urllib.parse.unquote_to_bytes(given) 1121 self.assertEqual(expect, result, "using unquote_to_bytes(): %r != %r" 1122 % (expect, result)) 1123 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote_to_bytes, None) 1124 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote_to_bytes, ()) 1125 1126 def test_unquoting_mixed_case(self): 1127 # Test unquoting on mixed-case hex digits in the percent-escapes 1128 given = '%Ab%eA' 1129 expect = b'\xab\xea' 1130 result = urllib.parse.unquote_to_bytes(given) 1131 self.assertEqual(expect, result, 1132 "using unquote_to_bytes(): %r != %r" 1133 % (expect, result)) 1134 1135 def test_unquoting_parts(self): 1136 # Make sure unquoting works when have non-quoted characters 1137 # interspersed 1138 given = 'ab%sd' % hexescape('c') 1139 expect = "abcd" 1140 result = urllib.parse.unquote(given) 1141 self.assertEqual(expect, result, 1142 "using quote(): %r != %r" % (expect, result)) 1143 result = urllib.parse.unquote_plus(given) 1144 self.assertEqual(expect, result, 1145 "using unquote_plus(): %r != %r" % (expect, result)) 1146 1147 def test_unquoting_plus(self): 1148 # Test difference between unquote() and unquote_plus() 1149 given = "are+there+spaces..." 1150 expect = given 1151 result = urllib.parse.unquote(given) 1152 self.assertEqual(expect, result, 1153 "using unquote(): %r != %r" % (expect, result)) 1154 expect = given.replace('+', ' ') 1155 result = urllib.parse.unquote_plus(given) 1156 self.assertEqual(expect, result, 1157 "using unquote_plus(): %r != %r" % (expect, result)) 1158 1159 def test_unquote_to_bytes(self): 1160 given = 'br%C3%BCckner_sapporo_20050930.doc' 1161 expect = b'br\xc3\xbcckner_sapporo_20050930.doc' 1162 result = urllib.parse.unquote_to_bytes(given) 1163 self.assertEqual(expect, result, 1164 "using unquote_to_bytes(): %r != %r" 1165 % (expect, result)) 1166 # Test on a string with unescaped non-ASCII characters 1167 # (Technically an invalid URI; expect those characters to be UTF-8 1168 # encoded). 1169 result = urllib.parse.unquote_to_bytes("\u6f22%C3%BC") 1170 expect = b'\xe6\xbc\xa2\xc3\xbc' # UTF-8 for "\u6f22\u00fc" 1171 self.assertEqual(expect, result, 1172 "using unquote_to_bytes(): %r != %r" 1173 % (expect, result)) 1174 # Test with a bytes as input 1175 given = b'%A2%D8ab%FF' 1176 expect = b'\xa2\xd8ab\xff' 1177 result = urllib.parse.unquote_to_bytes(given) 1178 self.assertEqual(expect, result, 1179 "using unquote_to_bytes(): %r != %r" 1180 % (expect, result)) 1181 # Test with a bytes as input, with unescaped non-ASCII bytes 1182 # (Technically an invalid URI; expect those bytes to be preserved) 1183 given = b'%A2\xd8ab%FF' 1184 expect = b'\xa2\xd8ab\xff' 1185 result = urllib.parse.unquote_to_bytes(given) 1186 self.assertEqual(expect, result, 1187 "using unquote_to_bytes(): %r != %r" 1188 % (expect, result)) 1189 1190 def test_unquote_with_unicode(self): 1191 # Characters in the Latin-1 range, encoded with UTF-8 1192 given = 'br%C3%BCckner_sapporo_20050930.doc' 1193 expect = 'br\u00fcckner_sapporo_20050930.doc' 1194 result = urllib.parse.unquote(given) 1195 self.assertEqual(expect, result, 1196 "using unquote(): %r != %r" % (expect, result)) 1197 # Characters in the Latin-1 range, encoded with None (default) 1198 result = urllib.parse.unquote(given, encoding=None, errors=None) 1199 self.assertEqual(expect, result, 1200 "using unquote(): %r != %r" % (expect, result)) 1201 1202 # Characters in the Latin-1 range, encoded with Latin-1 1203 result = urllib.parse.unquote('br%FCckner_sapporo_20050930.doc', 1204 encoding="latin-1") 1205 expect = 'br\u00fcckner_sapporo_20050930.doc' 1206 self.assertEqual(expect, result, 1207 "using unquote(): %r != %r" % (expect, result)) 1208 1209 # Characters in BMP, encoded with UTF-8 1210 given = "%E6%BC%A2%E5%AD%97" 1211 expect = "\u6f22\u5b57" # "Kanji" 1212 result = urllib.parse.unquote(given) 1213 self.assertEqual(expect, result, 1214 "using unquote(): %r != %r" % (expect, result)) 1215 1216 # Decode with UTF-8, invalid sequence 1217 given = "%F3%B1" 1218 expect = "\ufffd" # Replacement character 1219 result = urllib.parse.unquote(given) 1220 self.assertEqual(expect, result, 1221 "using unquote(): %r != %r" % (expect, result)) 1222 1223 # Decode with UTF-8, invalid sequence, replace errors 1224 result = urllib.parse.unquote(given, errors="replace") 1225 self.assertEqual(expect, result, 1226 "using unquote(): %r != %r" % (expect, result)) 1227 1228 # Decode with UTF-8, invalid sequence, ignoring errors 1229 given = "%F3%B1" 1230 expect = "" 1231 result = urllib.parse.unquote(given, errors="ignore") 1232 self.assertEqual(expect, result, 1233 "using unquote(): %r != %r" % (expect, result)) 1234 1235 # A mix of non-ASCII and percent-encoded characters, UTF-8 1236 result = urllib.parse.unquote("\u6f22%C3%BC") 1237 expect = '\u6f22\u00fc' 1238 self.assertEqual(expect, result, 1239 "using unquote(): %r != %r" % (expect, result)) 1240 1241 # A mix of non-ASCII and percent-encoded characters, Latin-1 1242 # (Note, the string contains non-Latin-1-representable characters) 1243 result = urllib.parse.unquote("\u6f22%FC", encoding="latin-1") 1244 expect = '\u6f22\u00fc' 1245 self.assertEqual(expect, result, 1246 "using unquote(): %r != %r" % (expect, result)) 1247 1248 def test_unquoting_with_bytes_input(self): 1249 # Bytes not supported yet 1250 with self.assertRaisesRegex(TypeError, 'Expected str, got bytes'): 1251 given = b'bl\xc3\xa5b\xc3\xa6rsyltet\xc3\xb8y' 1252 urllib.parse.unquote(given) 1253 1254class urlencode_Tests(unittest.TestCase): 1255 """Tests for urlencode()""" 1256 1257 def help_inputtype(self, given, test_type): 1258 """Helper method for testing different input types. 1259 1260 'given' must lead to only the pairs: 1261 * 1st, 1 1262 * 2nd, 2 1263 * 3rd, 3 1264 1265 Test cannot assume anything about order. Docs make no guarantee and 1266 have possible dictionary input. 1267 1268 """ 1269 expect_somewhere = ["1st=1", "2nd=2", "3rd=3"] 1270 result = urllib.parse.urlencode(given) 1271 for expected in expect_somewhere: 1272 self.assertIn(expected, result, 1273 "testing %s: %s not found in %s" % 1274 (test_type, expected, result)) 1275 self.assertEqual(result.count('&'), 2, 1276 "testing %s: expected 2 '&'s; got %s" % 1277 (test_type, result.count('&'))) 1278 amp_location = result.index('&') 1279 on_amp_left = result[amp_location - 1] 1280 on_amp_right = result[amp_location + 1] 1281 self.assertTrue(on_amp_left.isdigit() and on_amp_right.isdigit(), 1282 "testing %s: '&' not located in proper place in %s" % 1283 (test_type, result)) 1284 self.assertEqual(len(result), (5 * 3) + 2, #5 chars per thing and amps 1285 "testing %s: " 1286 "unexpected number of characters: %s != %s" % 1287 (test_type, len(result), (5 * 3) + 2)) 1288 1289 def test_using_mapping(self): 1290 # Test passing in a mapping object as an argument. 1291 self.help_inputtype({"1st":'1', "2nd":'2', "3rd":'3'}, 1292 "using dict as input type") 1293 1294 def test_using_sequence(self): 1295 # Test passing in a sequence of two-item sequences as an argument. 1296 self.help_inputtype([('1st', '1'), ('2nd', '2'), ('3rd', '3')], 1297 "using sequence of two-item tuples as input") 1298 1299 def test_quoting(self): 1300 # Make sure keys and values are quoted using quote_plus() 1301 given = {"&":"="} 1302 expect = "%s=%s" % (hexescape('&'), hexescape('=')) 1303 result = urllib.parse.urlencode(given) 1304 self.assertEqual(expect, result) 1305 given = {"key name":"A bunch of pluses"} 1306 expect = "key+name=A+bunch+of+pluses" 1307 result = urllib.parse.urlencode(given) 1308 self.assertEqual(expect, result) 1309 1310 def test_doseq(self): 1311 # Test that passing True for 'doseq' parameter works correctly 1312 given = {'sequence':['1', '2', '3']} 1313 expect = "sequence=%s" % urllib.parse.quote_plus(str(['1', '2', '3'])) 1314 result = urllib.parse.urlencode(given) 1315 self.assertEqual(expect, result) 1316 result = urllib.parse.urlencode(given, True) 1317 for value in given["sequence"]: 1318 expect = "sequence=%s" % value 1319 self.assertIn(expect, result) 1320 self.assertEqual(result.count('&'), 2, 1321 "Expected 2 '&'s, got %s" % result.count('&')) 1322 1323 def test_empty_sequence(self): 1324 self.assertEqual("", urllib.parse.urlencode({})) 1325 self.assertEqual("", urllib.parse.urlencode([])) 1326 1327 def test_nonstring_values(self): 1328 self.assertEqual("a=1", urllib.parse.urlencode({"a": 1})) 1329 self.assertEqual("a=None", urllib.parse.urlencode({"a": None})) 1330 1331 def test_nonstring_seq_values(self): 1332 self.assertEqual("a=1&a=2", urllib.parse.urlencode({"a": [1, 2]}, True)) 1333 self.assertEqual("a=None&a=a", 1334 urllib.parse.urlencode({"a": [None, "a"]}, True)) 1335 data = collections.OrderedDict([("a", 1), ("b", 1)]) 1336 self.assertEqual("a=a&a=b", 1337 urllib.parse.urlencode({"a": data}, True)) 1338 1339 def test_urlencode_encoding(self): 1340 # ASCII encoding. Expect %3F with errors="replace' 1341 given = (('\u00a0', '\u00c1'),) 1342 expect = '%3F=%3F' 1343 result = urllib.parse.urlencode(given, encoding="ASCII", errors="replace") 1344 self.assertEqual(expect, result) 1345 1346 # Default is UTF-8 encoding. 1347 given = (('\u00a0', '\u00c1'),) 1348 expect = '%C2%A0=%C3%81' 1349 result = urllib.parse.urlencode(given) 1350 self.assertEqual(expect, result) 1351 1352 # Latin-1 encoding. 1353 given = (('\u00a0', '\u00c1'),) 1354 expect = '%A0=%C1' 1355 result = urllib.parse.urlencode(given, encoding="latin-1") 1356 self.assertEqual(expect, result) 1357 1358 def test_urlencode_encoding_doseq(self): 1359 # ASCII Encoding. Expect %3F with errors="replace' 1360 given = (('\u00a0', '\u00c1'),) 1361 expect = '%3F=%3F' 1362 result = urllib.parse.urlencode(given, doseq=True, 1363 encoding="ASCII", errors="replace") 1364 self.assertEqual(expect, result) 1365 1366 # ASCII Encoding. On a sequence of values. 1367 given = (("\u00a0", (1, "\u00c1")),) 1368 expect = '%3F=1&%3F=%3F' 1369 result = urllib.parse.urlencode(given, True, 1370 encoding="ASCII", errors="replace") 1371 self.assertEqual(expect, result) 1372 1373 # Utf-8 1374 given = (("\u00a0", "\u00c1"),) 1375 expect = '%C2%A0=%C3%81' 1376 result = urllib.parse.urlencode(given, True) 1377 self.assertEqual(expect, result) 1378 1379 given = (("\u00a0", (42, "\u00c1")),) 1380 expect = '%C2%A0=42&%C2%A0=%C3%81' 1381 result = urllib.parse.urlencode(given, True) 1382 self.assertEqual(expect, result) 1383 1384 # latin-1 1385 given = (("\u00a0", "\u00c1"),) 1386 expect = '%A0=%C1' 1387 result = urllib.parse.urlencode(given, True, encoding="latin-1") 1388 self.assertEqual(expect, result) 1389 1390 given = (("\u00a0", (42, "\u00c1")),) 1391 expect = '%A0=42&%A0=%C1' 1392 result = urllib.parse.urlencode(given, True, encoding="latin-1") 1393 self.assertEqual(expect, result) 1394 1395 def test_urlencode_bytes(self): 1396 given = ((b'\xa0\x24', b'\xc1\x24'),) 1397 expect = '%A0%24=%C1%24' 1398 result = urllib.parse.urlencode(given) 1399 self.assertEqual(expect, result) 1400 result = urllib.parse.urlencode(given, True) 1401 self.assertEqual(expect, result) 1402 1403 # Sequence of values 1404 given = ((b'\xa0\x24', (42, b'\xc1\x24')),) 1405 expect = '%A0%24=42&%A0%24=%C1%24' 1406 result = urllib.parse.urlencode(given, True) 1407 self.assertEqual(expect, result) 1408 1409 def test_urlencode_encoding_safe_parameter(self): 1410 1411 # Send '$' (\x24) as safe character 1412 # Default utf-8 encoding 1413 1414 given = ((b'\xa0\x24', b'\xc1\x24'),) 1415 result = urllib.parse.urlencode(given, safe=":$") 1416 expect = '%A0$=%C1$' 1417 self.assertEqual(expect, result) 1418 1419 given = ((b'\xa0\x24', b'\xc1\x24'),) 1420 result = urllib.parse.urlencode(given, doseq=True, safe=":$") 1421 expect = '%A0$=%C1$' 1422 self.assertEqual(expect, result) 1423 1424 # Safe parameter in sequence 1425 given = ((b'\xa0\x24', (b'\xc1\x24', 0xd, 42)),) 1426 expect = '%A0$=%C1$&%A0$=13&%A0$=42' 1427 result = urllib.parse.urlencode(given, True, safe=":$") 1428 self.assertEqual(expect, result) 1429 1430 # Test all above in latin-1 encoding 1431 1432 given = ((b'\xa0\x24', b'\xc1\x24'),) 1433 result = urllib.parse.urlencode(given, safe=":$", 1434 encoding="latin-1") 1435 expect = '%A0$=%C1$' 1436 self.assertEqual(expect, result) 1437 1438 given = ((b'\xa0\x24', b'\xc1\x24'),) 1439 expect = '%A0$=%C1$' 1440 result = urllib.parse.urlencode(given, doseq=True, safe=":$", 1441 encoding="latin-1") 1442 1443 given = ((b'\xa0\x24', (b'\xc1\x24', 0xd, 42)),) 1444 expect = '%A0$=%C1$&%A0$=13&%A0$=42' 1445 result = urllib.parse.urlencode(given, True, safe=":$", 1446 encoding="latin-1") 1447 self.assertEqual(expect, result) 1448 1449class Pathname_Tests(unittest.TestCase): 1450 """Test pathname2url() and url2pathname()""" 1451 1452 def test_basic(self): 1453 # Make sure simple tests pass 1454 expected_path = os.path.join("parts", "of", "a", "path") 1455 expected_url = "parts/of/a/path" 1456 result = urllib.request.pathname2url(expected_path) 1457 self.assertEqual(expected_url, result, 1458 "pathname2url() failed; %s != %s" % 1459 (result, expected_url)) 1460 result = urllib.request.url2pathname(expected_url) 1461 self.assertEqual(expected_path, result, 1462 "url2pathame() failed; %s != %s" % 1463 (result, expected_path)) 1464 1465 def test_quoting(self): 1466 # Test automatic quoting and unquoting works for pathnam2url() and 1467 # url2pathname() respectively 1468 given = os.path.join("needs", "quot=ing", "here") 1469 expect = "needs/%s/here" % urllib.parse.quote("quot=ing") 1470 result = urllib.request.pathname2url(given) 1471 self.assertEqual(expect, result, 1472 "pathname2url() failed; %s != %s" % 1473 (expect, result)) 1474 expect = given 1475 result = urllib.request.url2pathname(result) 1476 self.assertEqual(expect, result, 1477 "url2pathname() failed; %s != %s" % 1478 (expect, result)) 1479 given = os.path.join("make sure", "using_quote") 1480 expect = "%s/using_quote" % urllib.parse.quote("make sure") 1481 result = urllib.request.pathname2url(given) 1482 self.assertEqual(expect, result, 1483 "pathname2url() failed; %s != %s" % 1484 (expect, result)) 1485 given = "make+sure/using_unquote" 1486 expect = os.path.join("make+sure", "using_unquote") 1487 result = urllib.request.url2pathname(given) 1488 self.assertEqual(expect, result, 1489 "url2pathname() failed; %s != %s" % 1490 (expect, result)) 1491 1492 @unittest.skipUnless(sys.platform == 'win32', 1493 'test specific to the nturl2path functions.') 1494 def test_prefixes(self): 1495 # Test special prefixes are correctly handled in pathname2url() 1496 given = '\\\\?\\C:\\dir' 1497 expect = '///C:/dir' 1498 result = urllib.request.pathname2url(given) 1499 self.assertEqual(expect, result, 1500 "pathname2url() failed; %s != %s" % 1501 (expect, result)) 1502 given = '\\\\?\\unc\\server\\share\\dir' 1503 expect = '/server/share/dir' 1504 result = urllib.request.pathname2url(given) 1505 self.assertEqual(expect, result, 1506 "pathname2url() failed; %s != %s" % 1507 (expect, result)) 1508 1509 1510 @unittest.skipUnless(sys.platform == 'win32', 1511 'test specific to the urllib.url2path function.') 1512 def test_ntpath(self): 1513 given = ('/C:/', '///C:/', '/C|//') 1514 expect = 'C:\\' 1515 for url in given: 1516 result = urllib.request.url2pathname(url) 1517 self.assertEqual(expect, result, 1518 'urllib.request..url2pathname() failed; %s != %s' % 1519 (expect, result)) 1520 given = '///C|/path' 1521 expect = 'C:\\path' 1522 result = urllib.request.url2pathname(given) 1523 self.assertEqual(expect, result, 1524 'urllib.request.url2pathname() failed; %s != %s' % 1525 (expect, result)) 1526 1527class Utility_Tests(unittest.TestCase): 1528 """Testcase to test the various utility functions in the urllib.""" 1529 1530 def test_thishost(self): 1531 """Test the urllib.request.thishost utility function returns a tuple""" 1532 self.assertIsInstance(urllib.request.thishost(), tuple) 1533 1534 1535class URLopener_Tests(FakeHTTPMixin, unittest.TestCase): 1536 """Testcase to test the open method of URLopener class.""" 1537 1538 def test_quoted_open(self): 1539 class DummyURLopener(urllib.request.URLopener): 1540 def open_spam(self, url): 1541 return url 1542 with support.check_warnings( 1543 ('DummyURLopener style of invoking requests is deprecated.', 1544 DeprecationWarning)): 1545 self.assertEqual(DummyURLopener().open( 1546 'spam://example/ /'),'//example/%20/') 1547 1548 # test the safe characters are not quoted by urlopen 1549 self.assertEqual(DummyURLopener().open( 1550 "spam://c:|windows%/:=&?~#+!$,;'@()*[]|/path/"), 1551 "//c:|windows%/:=&?~#+!$,;'@()*[]|/path/") 1552 1553 @support.ignore_warnings(category=DeprecationWarning) 1554 def test_urlopener_retrieve_file(self): 1555 with support.temp_dir() as tmpdir: 1556 fd, tmpfile = tempfile.mkstemp(dir=tmpdir) 1557 os.close(fd) 1558 fileurl = "file:" + urllib.request.pathname2url(tmpfile) 1559 filename, _ = urllib.request.URLopener().retrieve(fileurl) 1560 # Some buildbots have TEMP folder that uses a lowercase drive letter. 1561 self.assertEqual(os.path.normcase(filename), os.path.normcase(tmpfile)) 1562 1563 @support.ignore_warnings(category=DeprecationWarning) 1564 def test_urlopener_retrieve_remote(self): 1565 url = "http://www.python.org/file.txt" 1566 self.fakehttp(b"HTTP/1.1 200 OK\r\n\r\nHello!") 1567 self.addCleanup(self.unfakehttp) 1568 filename, _ = urllib.request.URLopener().retrieve(url) 1569 self.assertEqual(os.path.splitext(filename)[1], ".txt") 1570 1571 @support.ignore_warnings(category=DeprecationWarning) 1572 def test_local_file_open(self): 1573 # bpo-35907, CVE-2019-9948: urllib must reject local_file:// scheme 1574 class DummyURLopener(urllib.request.URLopener): 1575 def open_local_file(self, url): 1576 return url 1577 for url in ('local_file://example', 'local-file://example'): 1578 self.assertRaises(OSError, urllib.request.urlopen, url) 1579 self.assertRaises(OSError, urllib.request.URLopener().open, url) 1580 self.assertRaises(OSError, urllib.request.URLopener().retrieve, url) 1581 self.assertRaises(OSError, DummyURLopener().open, url) 1582 self.assertRaises(OSError, DummyURLopener().retrieve, url) 1583 1584 1585# Just commented them out. 1586# Can't really tell why keep failing in windows and sparc. 1587# Everywhere else they work ok, but on those machines, sometimes 1588# fail in one of the tests, sometimes in other. I have a linux, and 1589# the tests go ok. 1590# If anybody has one of the problematic environments, please help! 1591# . Facundo 1592# 1593# def server(evt): 1594# import socket, time 1595# serv = socket.socket(socket.AF_INET, socket.SOCK_STREAM) 1596# serv.settimeout(3) 1597# serv.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1) 1598# serv.bind(("", 9093)) 1599# serv.listen() 1600# try: 1601# conn, addr = serv.accept() 1602# conn.send("1 Hola mundo\n") 1603# cantdata = 0 1604# while cantdata < 13: 1605# data = conn.recv(13-cantdata) 1606# cantdata += len(data) 1607# time.sleep(.3) 1608# conn.send("2 No more lines\n") 1609# conn.close() 1610# except socket.timeout: 1611# pass 1612# finally: 1613# serv.close() 1614# evt.set() 1615# 1616# class FTPWrapperTests(unittest.TestCase): 1617# 1618# def setUp(self): 1619# import ftplib, time, threading 1620# ftplib.FTP.port = 9093 1621# self.evt = threading.Event() 1622# threading.Thread(target=server, args=(self.evt,)).start() 1623# time.sleep(.1) 1624# 1625# def tearDown(self): 1626# self.evt.wait() 1627# 1628# def testBasic(self): 1629# # connects 1630# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, []) 1631# ftp.close() 1632# 1633# def testTimeoutNone(self): 1634# # global default timeout is ignored 1635# import socket 1636# self.assertIsNone(socket.getdefaulttimeout()) 1637# socket.setdefaulttimeout(30) 1638# try: 1639# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, []) 1640# finally: 1641# socket.setdefaulttimeout(None) 1642# self.assertEqual(ftp.ftp.sock.gettimeout(), 30) 1643# ftp.close() 1644# 1645# def testTimeoutDefault(self): 1646# # global default timeout is used 1647# import socket 1648# self.assertIsNone(socket.getdefaulttimeout()) 1649# socket.setdefaulttimeout(30) 1650# try: 1651# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, []) 1652# finally: 1653# socket.setdefaulttimeout(None) 1654# self.assertEqual(ftp.ftp.sock.gettimeout(), 30) 1655# ftp.close() 1656# 1657# def testTimeoutValue(self): 1658# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [], 1659# timeout=30) 1660# self.assertEqual(ftp.ftp.sock.gettimeout(), 30) 1661# ftp.close() 1662 1663 1664class RequestTests(unittest.TestCase): 1665 """Unit tests for urllib.request.Request.""" 1666 1667 def test_default_values(self): 1668 Request = urllib.request.Request 1669 request = Request("http://www.python.org") 1670 self.assertEqual(request.get_method(), 'GET') 1671 request = Request("http://www.python.org", {}) 1672 self.assertEqual(request.get_method(), 'POST') 1673 1674 def test_with_method_arg(self): 1675 Request = urllib.request.Request 1676 request = Request("http://www.python.org", method='HEAD') 1677 self.assertEqual(request.method, 'HEAD') 1678 self.assertEqual(request.get_method(), 'HEAD') 1679 request = Request("http://www.python.org", {}, method='HEAD') 1680 self.assertEqual(request.method, 'HEAD') 1681 self.assertEqual(request.get_method(), 'HEAD') 1682 request = Request("http://www.python.org", method='GET') 1683 self.assertEqual(request.get_method(), 'GET') 1684 request.method = 'HEAD' 1685 self.assertEqual(request.get_method(), 'HEAD') 1686 1687 1688class URL2PathNameTests(unittest.TestCase): 1689 1690 def test_converting_drive_letter(self): 1691 self.assertEqual(url2pathname("///C|"), 'C:') 1692 self.assertEqual(url2pathname("///C:"), 'C:') 1693 self.assertEqual(url2pathname("///C|/"), 'C:\\') 1694 1695 def test_converting_when_no_drive_letter(self): 1696 # cannot end a raw string in \ 1697 self.assertEqual(url2pathname("///C/test/"), r'\\\C\test' '\\') 1698 self.assertEqual(url2pathname("////C/test/"), r'\\C\test' '\\') 1699 1700 def test_simple_compare(self): 1701 self.assertEqual(url2pathname("///C|/foo/bar/spam.foo"), 1702 r'C:\foo\bar\spam.foo') 1703 1704 def test_non_ascii_drive_letter(self): 1705 self.assertRaises(IOError, url2pathname, "///\u00e8|/") 1706 1707 def test_roundtrip_url2pathname(self): 1708 list_of_paths = ['C:', 1709 r'\\\C\test\\', 1710 r'C:\foo\bar\spam.foo' 1711 ] 1712 for path in list_of_paths: 1713 self.assertEqual(url2pathname(pathname2url(path)), path) 1714 1715class PathName2URLTests(unittest.TestCase): 1716 1717 def test_converting_drive_letter(self): 1718 self.assertEqual(pathname2url("C:"), '///C:') 1719 self.assertEqual(pathname2url("C:\\"), '///C:') 1720 1721 def test_converting_when_no_drive_letter(self): 1722 self.assertEqual(pathname2url(r"\\\folder\test" "\\"), 1723 '/////folder/test/') 1724 self.assertEqual(pathname2url(r"\\folder\test" "\\"), 1725 '////folder/test/') 1726 self.assertEqual(pathname2url(r"\folder\test" "\\"), 1727 '/folder/test/') 1728 1729 def test_simple_compare(self): 1730 self.assertEqual(pathname2url(r'C:\foo\bar\spam.foo'), 1731 "///C:/foo/bar/spam.foo" ) 1732 1733 def test_long_drive_letter(self): 1734 self.assertRaises(IOError, pathname2url, "XX:\\") 1735 1736 def test_roundtrip_pathname2url(self): 1737 list_of_paths = ['///C:', 1738 '/////folder/test/', 1739 '///C:/foo/bar/spam.foo'] 1740 for path in list_of_paths: 1741 self.assertEqual(pathname2url(url2pathname(path)), path) 1742 1743if __name__ == '__main__': 1744 unittest.main() 1745