mirror of
				https://github.com/python/cpython.git
				synced 2025-10-25 18:54:53 +00:00 
			
		
		
		
	 1afc169616
			
		
	
	
		1afc169616
		
	
	
	
	
		
			
			It consists of code from urllib, urllib2, urlparse, and robotparser. The old modules have all been removed. The new package has five submodules: urllib.parse, urllib.request, urllib.response, urllib.error, and urllib.robotparser. The urllib.request.urlopen() function uses the url opener from urllib2. Note that the unittests have not been renamed for the beta, but they will be renamed in the future. Joint work with Senthil Kumaran.
		
			
				
	
	
		
			196 lines
		
	
	
	
		
			6.9 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			196 lines
		
	
	
	
		
			6.9 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #!/usr/bin/env python
 | |
| 
 | |
| import unittest
 | |
| from test import support
 | |
| 
 | |
| import socket
 | |
| import urllib.request
 | |
| import sys
 | |
| import os
 | |
| import email.message
 | |
| 
 | |
| 
 | |
def _open_with_retry(func, host, *args, **kwargs):
    """Call ``func(host, *args, **kwargs)``, retrying when it raises IOError.

    Connecting to remote hosts is flaky, so the call is attempted up to
    three times and the first successful result is returned.

    Raises:
        IOError: the error from the last attempt when all three fail.
        Any other exception propagates immediately, without a retry.
    """
    last_exc = None
    for _attempt in range(3):
        try:
            return func(host, *args, **kwargs)
        except IOError as err:
            # Keep the failure around; it is re-raised only if every
            # attempt fails.
            last_exc = err
    raise last_exc
 | |
| 
 | |
| 
 | |
class URLTimeoutTest(unittest.TestCase):
    """Check that a URL can be read while a default socket timeout is set."""

    # Default socket timeout (seconds) installed for the duration of a test.
    TIMEOUT = 10.0

    def setUp(self):
        # Remember the timeout that was in force so tearDown can restore it
        # instead of unconditionally resetting the global default to None.
        self._saved_timeout = socket.getdefaulttimeout()
        socket.setdefaulttimeout(self.TIMEOUT)

    def tearDown(self):
        socket.setdefaulttimeout(self._saved_timeout)

    def testURLread(self):
        # Reading must complete without raising; the payload is not inspected.
        f = _open_with_retry(urllib.request.urlopen, "http://www.python.org/")
        try:
            f.read()
        finally:
            # Always release the connection, even if the read fails.
            f.close()
 | |
| 
 | |
class urlopenNetworkTests(unittest.TestCase):
    """Tests urllib.request.urlopen using the network.

    These tests are not exhaustive.  Assuming that testing using files does a
    good job overall of some of the basic interface features.  There are no
    tests exercising the optional 'data' and 'proxies' arguments.  No tests
    for transparent redirection have been written.

    setUp is not used for always constructing a connection to
    http://www.python.org/ since there are a few tests that don't use that
    address and making a connection is expensive enough to warrant minimizing
    unneeded connections.

    """

    def urlopen(self, *args):
        """Open a URL via urllib.request.urlopen, retrying on IOError."""
        return _open_with_retry(urllib.request.urlopen, *args)

    def test_basic(self):
        # Simple test expected to pass.
        open_url = self.urlopen("http://www.python.org/")
        for attr in ("read", "readline", "readlines", "fileno", "close",
                     "info", "geturl"):
            self.assertTrue(hasattr(open_url, attr), "object returned from "
                            "urlopen lacks the %s attribute" % attr)
        try:
            self.assertTrue(open_url.read(), "calling 'read' failed")
        finally:
            open_url.close()

    def test_readlines(self):
        # Test both readline and readlines.
        open_url = self.urlopen("http://www.python.org/")
        try:
            self.assertTrue(isinstance(open_url.readline(), bytes),
                            "readline did not return bytes")
            self.assertTrue(isinstance(open_url.readlines(), list),
                            "readlines did not return a list")
        finally:
            open_url.close()

    def test_info(self):
        # Test 'info'.
        open_url = self.urlopen("http://www.python.org/")
        try:
            info_obj = open_url.info()
        finally:
            open_url.close()
        # The checks run after the cleanup, not inside ``finally``: if info()
        # itself raised, info_obj would be unbound and a NameError would hide
        # the real failure.
        self.assertTrue(isinstance(info_obj, email.message.Message),
                        "object returned by 'info' is not an instance of "
                        "email.message.Message")
        self.assertEqual(info_obj.get_content_subtype(), "html")

    def test_geturl(self):
        # Make sure same URL as opened is returned by geturl.
        URL = "http://www.python.org/"
        open_url = self.urlopen(URL)
        try:
            gotten_url = open_url.geturl()
        finally:
            open_url.close()
        self.assertEqual(gotten_url, URL)

    def test_getcode(self):
        # test getcode() with the fancy opener to get 404 error codes
        URL = "http://www.python.org/XXXinvalidXXX"
        open_url = urllib.request.FancyURLopener().open(URL)
        try:
            code = open_url.getcode()
        finally:
            open_url.close()
        self.assertEqual(code, 404)

    def test_fileno(self):
        if (sys.platform in ('win32',) or
            not hasattr(os, 'fdopen')):
            # On Windows, socket handles are not file descriptors; this
            # test can't pass on Windows.
            return
        # Make sure fd returned by fileno is valid.
        open_url = self.urlopen("http://www.python.org/")
        fd = open_url.fileno()
        # The builtin open() accepts a file descriptor and takes the error
        # handler as a public argument, so there is no need to poke the
        # private ``_errors`` attribute of the resulting file object.
        FILE = open(fd, errors='ignore')
        try:
            self.assertTrue(FILE.read(), "reading from file created using fd "
                                         "returned by fileno failed")
        finally:
            FILE.close()

    def test_bad_address(self):
        # Make sure proper exception is raised when connecting to a bogus
        # address.
        self.assertRaises(IOError,
                          # SF patch 809915:  In Sep 2003, VeriSign started
                          # highjacking invalid .com and .net addresses to
                          # boost traffic to their own site.  This test
                          # started failing then.  One hopes the .invalid
                          # domain will be spared to serve its defined
                          # purpose.
                          # urllib.urlopen, "http://www.sadflkjsasadf.com/")
                          urllib.request.urlopen,
                          "http://www.python.invalid./")
 | |
| 
 | |
class urlretrieveNetworkTests(unittest.TestCase):
    """Tests urllib.request.urlretrieve using the network."""

    def urlretrieve(self, *args):
        """Call urllib.request.urlretrieve, retrying on IOError."""
        return _open_with_retry(urllib.request.urlretrieve, *args)

    def _remove(self, path):
        # Best-effort cleanup: the file may be missing if retrieval went wrong,
        # and a second error here must not hide the original test failure.
        if os.path.exists(path):
            os.unlink(path)

    def test_basic(self):
        # Test basic functionality.
        file_location, info = self.urlretrieve("http://www.python.org/")
        try:
            self.assertTrue(os.path.exists(file_location),
                            "file location returned by"
                            " urlretrieve is not a valid path")
            with open(file_location, errors='ignore') as FILE:
                self.assertTrue(FILE.read(),
                                "reading from the file location returned"
                                " by urlretrieve failed")
        finally:
            # Remove the download even when an assertion above fails.
            self._remove(file_location)

    def test_specified_path(self):
        # Make sure that specifying the location of the file to write to works.
        file_location, info = self.urlretrieve("http://www.python.org/",
                                               support.TESTFN)
        try:
            self.assertEqual(file_location, support.TESTFN)
            self.assertTrue(os.path.exists(file_location))
            with open(file_location, errors='ignore') as FILE:
                self.assertTrue(FILE.read(),
                                "reading from temporary file failed")
        finally:
            # Remove the download even when an assertion above fails.
            self._remove(file_location)

    def test_header(self):
        # Make sure header returned as 2nd value from urlretrieve is good.
        file_location, header = self.urlretrieve("http://www.python.org/")
        os.unlink(file_location)
        self.assertTrue(isinstance(header, email.message.Message),
                        "header is not an instance of email.message.Message")
 | |
| 
 | |
| 
 | |
| 
 | |
def test_main():
    """Run all test cases in this module; needs the 'network' resource."""
    support.requires('network')
    test_cases = (
        URLTimeoutTest,
        urlopenNetworkTests,
        urlretrieveNetworkTests,
    )
    support.run_unittest(*test_cases)
 | |
| 
 | |
# Allow the module to be run directly as a script.
if __name__ == "__main__":
    test_main()
 |