| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700 |
- import base64
- import os
- import email
- import urllib.parse
- import urllib.request
- import http.server
- import threading
- import unittest
- import hashlib
- from test import support
- from test.support import hashlib_helper
- from test.support import threading_helper
- from test.support import warnings_helper
- try:
- import ssl
- except ImportError:
- ssl = None
- support.requires_working_socket(module=True)
- here = os.path.dirname(__file__)
- # Self-signed cert file for 'localhost'
- CERT_localhost = os.path.join(here, 'keycert.pem')
- # Self-signed cert file for 'fakehostname'
- CERT_fakehostname = os.path.join(here, 'keycert2.pem')
- # Loopback http server infrastructure
- class LoopbackHttpServer(http.server.HTTPServer):
- """HTTP server w/ a few modifications that make it useful for
- loopback testing purposes.
- """
- def __init__(self, server_address, RequestHandlerClass):
- http.server.HTTPServer.__init__(self,
- server_address,
- RequestHandlerClass)
- # Set the timeout of our listening socket really low so
- # that we can stop the server easily.
- self.socket.settimeout(0.1)
- def get_request(self):
- """HTTPServer method, overridden."""
- request, client_address = self.socket.accept()
- # It's a loopback connection, so setting the timeout
- # really low shouldn't affect anything, but should make
- # deadlocks less likely to occur.
- request.settimeout(10.0)
- return (request, client_address)
- class LoopbackHttpServerThread(threading.Thread):
- """Stoppable thread that runs a loopback http server."""
- def __init__(self, request_handler):
- threading.Thread.__init__(self)
- self._stop_server = False
- self.ready = threading.Event()
- request_handler.protocol_version = "HTTP/1.0"
- self.httpd = LoopbackHttpServer(("127.0.0.1", 0),
- request_handler)
- self.port = self.httpd.server_port
- def stop(self):
- """Stops the webserver if it's currently running."""
- self._stop_server = True
- self.join()
- self.httpd.server_close()
- def run(self):
- self.ready.set()
- while not self._stop_server:
- self.httpd.handle_request()
- # Authentication infrastructure
- class DigestAuthHandler:
- """Handler for performing digest authentication."""
- def __init__(self):
- self._request_num = 0
- self._nonces = []
- self._users = {}
- self._realm_name = "Test Realm"
- self._qop = "auth"
- def set_qop(self, qop):
- self._qop = qop
- def set_users(self, users):
- assert isinstance(users, dict)
- self._users = users
- def set_realm(self, realm):
- self._realm_name = realm
- def _generate_nonce(self):
- self._request_num += 1
- nonce = hashlib.md5(str(self._request_num).encode("ascii")).hexdigest()
- self._nonces.append(nonce)
- return nonce
- def _create_auth_dict(self, auth_str):
- first_space_index = auth_str.find(" ")
- auth_str = auth_str[first_space_index+1:]
- parts = auth_str.split(",")
- auth_dict = {}
- for part in parts:
- name, value = part.split("=")
- name = name.strip()
- if value[0] == '"' and value[-1] == '"':
- value = value[1:-1]
- else:
- value = value.strip()
- auth_dict[name] = value
- return auth_dict
- def _validate_auth(self, auth_dict, password, method, uri):
- final_dict = {}
- final_dict.update(auth_dict)
- final_dict["password"] = password
- final_dict["method"] = method
- final_dict["uri"] = uri
- HA1_str = "%(username)s:%(realm)s:%(password)s" % final_dict
- HA1 = hashlib.md5(HA1_str.encode("ascii")).hexdigest()
- HA2_str = "%(method)s:%(uri)s" % final_dict
- HA2 = hashlib.md5(HA2_str.encode("ascii")).hexdigest()
- final_dict["HA1"] = HA1
- final_dict["HA2"] = HA2
- response_str = "%(HA1)s:%(nonce)s:%(nc)s:" \
- "%(cnonce)s:%(qop)s:%(HA2)s" % final_dict
- response = hashlib.md5(response_str.encode("ascii")).hexdigest()
- return response == auth_dict["response"]
- def _return_auth_challenge(self, request_handler):
- request_handler.send_response(407, "Proxy Authentication Required")
- request_handler.send_header("Content-Type", "text/html")
- request_handler.send_header(
- 'Proxy-Authenticate', 'Digest realm="%s", '
- 'qop="%s",'
- 'nonce="%s", ' % \
- (self._realm_name, self._qop, self._generate_nonce()))
- # XXX: Not sure if we're supposed to add this next header or
- # not.
- #request_handler.send_header('Connection', 'close')
- request_handler.end_headers()
- request_handler.wfile.write(b"Proxy Authentication Required.")
- return False
- def handle_request(self, request_handler):
- """Performs digest authentication on the given HTTP request
- handler. Returns True if authentication was successful, False
- otherwise.
- If no users have been set, then digest auth is effectively
- disabled and this method will always return True.
- """
- if len(self._users) == 0:
- return True
- if "Proxy-Authorization" not in request_handler.headers:
- return self._return_auth_challenge(request_handler)
- else:
- auth_dict = self._create_auth_dict(
- request_handler.headers["Proxy-Authorization"]
- )
- if auth_dict["username"] in self._users:
- password = self._users[ auth_dict["username"] ]
- else:
- return self._return_auth_challenge(request_handler)
- if not auth_dict.get("nonce") in self._nonces:
- return self._return_auth_challenge(request_handler)
- else:
- self._nonces.remove(auth_dict["nonce"])
- auth_validated = False
- # MSIE uses short_path in its validation, but Python's
- # urllib.request uses the full path, so we're going to see if
- # either of them works here.
- for path in [request_handler.path, request_handler.short_path]:
- if self._validate_auth(auth_dict,
- password,
- request_handler.command,
- path):
- auth_validated = True
- if not auth_validated:
- return self._return_auth_challenge(request_handler)
- return True
- class BasicAuthHandler(http.server.BaseHTTPRequestHandler):
- """Handler for performing basic authentication."""
- # Server side values
- USER = 'testUser'
- PASSWD = 'testPass'
- REALM = 'Test'
- USER_PASSWD = "%s:%s" % (USER, PASSWD)
- ENCODED_AUTH = base64.b64encode(USER_PASSWD.encode('ascii')).decode('ascii')
- def __init__(self, *args, **kwargs):
- http.server.BaseHTTPRequestHandler.__init__(self, *args, **kwargs)
- def log_message(self, format, *args):
- # Suppress console log message
- pass
- def do_HEAD(self):
- self.send_response(200)
- self.send_header("Content-type", "text/html")
- self.end_headers()
- def do_AUTHHEAD(self):
- self.send_response(401)
- self.send_header("WWW-Authenticate", "Basic realm=\"%s\"" % self.REALM)
- self.send_header("Content-type", "text/html")
- self.end_headers()
- def do_GET(self):
- if not self.headers.get("Authorization", ""):
- self.do_AUTHHEAD()
- self.wfile.write(b"No Auth header received")
- elif self.headers.get(
- "Authorization", "") == "Basic " + self.ENCODED_AUTH:
- self.send_response(200)
- self.end_headers()
- self.wfile.write(b"It works")
- else:
- # Request Unauthorized
- self.do_AUTHHEAD()
- # Proxy test infrastructure
- class FakeProxyHandler(http.server.BaseHTTPRequestHandler):
- """This is a 'fake proxy' that makes it look like the entire
- internet has gone down due to a sudden zombie invasion. It main
- utility is in providing us with authentication support for
- testing.
- """
- def __init__(self, digest_auth_handler, *args, **kwargs):
- # This has to be set before calling our parent's __init__(), which will
- # try to call do_GET().
- self.digest_auth_handler = digest_auth_handler
- http.server.BaseHTTPRequestHandler.__init__(self, *args, **kwargs)
- def log_message(self, format, *args):
- # Uncomment the next line for debugging.
- # sys.stderr.write(format % args)
- pass
- def do_GET(self):
- (scm, netloc, path, params, query, fragment) = urllib.parse.urlparse(
- self.path, "http")
- self.short_path = path
- if self.digest_auth_handler.handle_request(self):
- self.send_response(200, "OK")
- self.send_header("Content-Type", "text/html")
- self.end_headers()
- self.wfile.write(bytes("You've reached %s!<BR>" % self.path,
- "ascii"))
- self.wfile.write(b"Our apologies, but our server is down due to "
- b"a sudden zombie invasion.")
- # Test cases
- class BasicAuthTests(unittest.TestCase):
- USER = "testUser"
- PASSWD = "testPass"
- INCORRECT_PASSWD = "Incorrect"
- REALM = "Test"
- def setUp(self):
- super(BasicAuthTests, self).setUp()
- # With Basic Authentication
- def http_server_with_basic_auth_handler(*args, **kwargs):
- return BasicAuthHandler(*args, **kwargs)
- self.server = LoopbackHttpServerThread(http_server_with_basic_auth_handler)
- self.addCleanup(self.stop_server)
- self.server_url = 'http://127.0.0.1:%s' % self.server.port
- self.server.start()
- self.server.ready.wait()
- def stop_server(self):
- self.server.stop()
- self.server = None
- def tearDown(self):
- super(BasicAuthTests, self).tearDown()
- def test_basic_auth_success(self):
- ah = urllib.request.HTTPBasicAuthHandler()
- ah.add_password(self.REALM, self.server_url, self.USER, self.PASSWD)
- urllib.request.install_opener(urllib.request.build_opener(ah))
- try:
- self.assertTrue(urllib.request.urlopen(self.server_url))
- except urllib.error.HTTPError:
- self.fail("Basic auth failed for the url: %s" % self.server_url)
- def test_basic_auth_httperror(self):
- ah = urllib.request.HTTPBasicAuthHandler()
- ah.add_password(self.REALM, self.server_url, self.USER, self.INCORRECT_PASSWD)
- urllib.request.install_opener(urllib.request.build_opener(ah))
- self.assertRaises(urllib.error.HTTPError, urllib.request.urlopen, self.server_url)
- @hashlib_helper.requires_hashdigest("md5", openssl=True)
- class ProxyAuthTests(unittest.TestCase):
- URL = "http://localhost"
- USER = "tester"
- PASSWD = "test123"
- REALM = "TestRealm"
- def setUp(self):
- super(ProxyAuthTests, self).setUp()
- # Ignore proxy bypass settings in the environment.
- def restore_environ(old_environ):
- os.environ.clear()
- os.environ.update(old_environ)
- self.addCleanup(restore_environ, os.environ.copy())
- os.environ['NO_PROXY'] = ''
- os.environ['no_proxy'] = ''
- self.digest_auth_handler = DigestAuthHandler()
- self.digest_auth_handler.set_users({self.USER: self.PASSWD})
- self.digest_auth_handler.set_realm(self.REALM)
- # With Digest Authentication.
- def create_fake_proxy_handler(*args, **kwargs):
- return FakeProxyHandler(self.digest_auth_handler, *args, **kwargs)
- self.server = LoopbackHttpServerThread(create_fake_proxy_handler)
- self.addCleanup(self.stop_server)
- self.server.start()
- self.server.ready.wait()
- proxy_url = "http://127.0.0.1:%d" % self.server.port
- handler = urllib.request.ProxyHandler({"http" : proxy_url})
- self.proxy_digest_handler = urllib.request.ProxyDigestAuthHandler()
- self.opener = urllib.request.build_opener(
- handler, self.proxy_digest_handler)
- def stop_server(self):
- self.server.stop()
- self.server = None
- def test_proxy_with_bad_password_raises_httperror(self):
- self.proxy_digest_handler.add_password(self.REALM, self.URL,
- self.USER, self.PASSWD+"bad")
- self.digest_auth_handler.set_qop("auth")
- self.assertRaises(urllib.error.HTTPError,
- self.opener.open,
- self.URL)
- def test_proxy_with_no_password_raises_httperror(self):
- self.digest_auth_handler.set_qop("auth")
- self.assertRaises(urllib.error.HTTPError,
- self.opener.open,
- self.URL)
- def test_proxy_qop_auth_works(self):
- self.proxy_digest_handler.add_password(self.REALM, self.URL,
- self.USER, self.PASSWD)
- self.digest_auth_handler.set_qop("auth")
- with self.opener.open(self.URL) as result:
- while result.read():
- pass
- def test_proxy_qop_auth_int_works_or_throws_urlerror(self):
- self.proxy_digest_handler.add_password(self.REALM, self.URL,
- self.USER, self.PASSWD)
- self.digest_auth_handler.set_qop("auth-int")
- try:
- result = self.opener.open(self.URL)
- except urllib.error.URLError:
- # It's okay if we don't support auth-int, but we certainly
- # shouldn't receive any kind of exception here other than
- # a URLError.
- pass
- else:
- with result:
- while result.read():
- pass
- def GetRequestHandler(responses):
- class FakeHTTPRequestHandler(http.server.BaseHTTPRequestHandler):
- server_version = "TestHTTP/"
- requests = []
- headers_received = []
- port = 80
- def do_GET(self):
- body = self.send_head()
- while body:
- done = self.wfile.write(body)
- body = body[done:]
- def do_POST(self):
- content_length = self.headers["Content-Length"]
- post_data = self.rfile.read(int(content_length))
- self.do_GET()
- self.requests.append(post_data)
- def send_head(self):
- FakeHTTPRequestHandler.headers_received = self.headers
- self.requests.append(self.path)
- response_code, headers, body = responses.pop(0)
- self.send_response(response_code)
- for (header, value) in headers:
- self.send_header(header, value % {'port':self.port})
- if body:
- self.send_header("Content-type", "text/plain")
- self.end_headers()
- return body
- self.end_headers()
- def log_message(self, *args):
- pass
- return FakeHTTPRequestHandler
- class TestUrlopen(unittest.TestCase):
- """Tests urllib.request.urlopen using the network.
- These tests are not exhaustive. Assuming that testing using files does a
- good job overall of some of the basic interface features. There are no
- tests exercising the optional 'data' and 'proxies' arguments. No tests
- for transparent redirection have been written.
- """
- def setUp(self):
- super(TestUrlopen, self).setUp()
- # clear _opener global variable
- self.addCleanup(urllib.request.urlcleanup)
- # Ignore proxies for localhost tests.
- def restore_environ(old_environ):
- os.environ.clear()
- os.environ.update(old_environ)
- self.addCleanup(restore_environ, os.environ.copy())
- os.environ['NO_PROXY'] = '*'
- os.environ['no_proxy'] = '*'
- def urlopen(self, url, data=None, **kwargs):
- l = []
- f = urllib.request.urlopen(url, data, **kwargs)
- try:
- # Exercise various methods
- l.extend(f.readlines(200))
- l.append(f.readline())
- l.append(f.read(1024))
- l.append(f.read())
- finally:
- f.close()
- return b"".join(l)
- def stop_server(self):
- self.server.stop()
- self.server = None
- def start_server(self, responses=None):
- if responses is None:
- responses = [(200, [], b"we don't care")]
- handler = GetRequestHandler(responses)
- self.server = LoopbackHttpServerThread(handler)
- self.addCleanup(self.stop_server)
- self.server.start()
- self.server.ready.wait()
- port = self.server.port
- handler.port = port
- return handler
- def start_https_server(self, responses=None, **kwargs):
- if not hasattr(urllib.request, 'HTTPSHandler'):
- self.skipTest('ssl support required')
- from test.ssl_servers import make_https_server
- if responses is None:
- responses = [(200, [], b"we care a bit")]
- handler = GetRequestHandler(responses)
- server = make_https_server(self, handler_class=handler, **kwargs)
- handler.port = server.port
- return handler
- def test_redirection(self):
- expected_response = b"We got here..."
- responses = [
- (302, [("Location", "http://localhost:%(port)s/somewhere_else")],
- ""),
- (200, [], expected_response)
- ]
- handler = self.start_server(responses)
- data = self.urlopen("http://localhost:%s/" % handler.port)
- self.assertEqual(data, expected_response)
- self.assertEqual(handler.requests, ["/", "/somewhere_else"])
- def test_chunked(self):
- expected_response = b"hello world"
- chunked_start = (
- b'a\r\n'
- b'hello worl\r\n'
- b'1\r\n'
- b'd\r\n'
- b'0\r\n'
- )
- response = [(200, [("Transfer-Encoding", "chunked")], chunked_start)]
- handler = self.start_server(response)
- data = self.urlopen("http://localhost:%s/" % handler.port)
- self.assertEqual(data, expected_response)
- def test_404(self):
- expected_response = b"Bad bad bad..."
- handler = self.start_server([(404, [], expected_response)])
- try:
- self.urlopen("http://localhost:%s/weeble" % handler.port)
- except urllib.error.URLError as f:
- data = f.read()
- f.close()
- else:
- self.fail("404 should raise URLError")
- self.assertEqual(data, expected_response)
- self.assertEqual(handler.requests, ["/weeble"])
- def test_200(self):
- expected_response = b"pycon 2008..."
- handler = self.start_server([(200, [], expected_response)])
- data = self.urlopen("http://localhost:%s/bizarre" % handler.port)
- self.assertEqual(data, expected_response)
- self.assertEqual(handler.requests, ["/bizarre"])
- def test_200_with_parameters(self):
- expected_response = b"pycon 2008..."
- handler = self.start_server([(200, [], expected_response)])
- data = self.urlopen("http://localhost:%s/bizarre" % handler.port,
- b"get=with_feeling")
- self.assertEqual(data, expected_response)
- self.assertEqual(handler.requests, ["/bizarre", b"get=with_feeling"])
- def test_https(self):
- handler = self.start_https_server()
- context = ssl.create_default_context(cafile=CERT_localhost)
- data = self.urlopen("https://localhost:%s/bizarre" % handler.port, context=context)
- self.assertEqual(data, b"we care a bit")
- def test_https_with_cafile(self):
- handler = self.start_https_server(certfile=CERT_localhost)
- with warnings_helper.check_warnings(('', DeprecationWarning)):
- # Good cert
- data = self.urlopen("https://localhost:%s/bizarre" % handler.port,
- cafile=CERT_localhost)
- self.assertEqual(data, b"we care a bit")
- # Bad cert
- with self.assertRaises(urllib.error.URLError) as cm:
- self.urlopen("https://localhost:%s/bizarre" % handler.port,
- cafile=CERT_fakehostname)
- # Good cert, but mismatching hostname
- handler = self.start_https_server(certfile=CERT_fakehostname)
- with self.assertRaises(urllib.error.URLError) as cm:
- self.urlopen("https://localhost:%s/bizarre" % handler.port,
- cafile=CERT_fakehostname)
- def test_https_with_cadefault(self):
- handler = self.start_https_server(certfile=CERT_localhost)
- # Self-signed cert should fail verification with system certificate store
- with warnings_helper.check_warnings(('', DeprecationWarning)):
- with self.assertRaises(urllib.error.URLError) as cm:
- self.urlopen("https://localhost:%s/bizarre" % handler.port,
- cadefault=True)
- def test_https_sni(self):
- if ssl is None:
- self.skipTest("ssl module required")
- if not ssl.HAS_SNI:
- self.skipTest("SNI support required in OpenSSL")
- sni_name = None
- def cb_sni(ssl_sock, server_name, initial_context):
- nonlocal sni_name
- sni_name = server_name
- context = ssl.SSLContext(ssl.PROTOCOL_TLS_SERVER)
- context.set_servername_callback(cb_sni)
- handler = self.start_https_server(context=context, certfile=CERT_localhost)
- context = ssl.create_default_context(cafile=CERT_localhost)
- self.urlopen("https://localhost:%s" % handler.port, context=context)
- self.assertEqual(sni_name, "localhost")
- def test_sending_headers(self):
- handler = self.start_server()
- req = urllib.request.Request("http://localhost:%s/" % handler.port,
- headers={"Range": "bytes=20-39"})
- with urllib.request.urlopen(req):
- pass
- self.assertEqual(handler.headers_received["Range"], "bytes=20-39")
- def test_sending_headers_camel(self):
- handler = self.start_server()
- req = urllib.request.Request("http://localhost:%s/" % handler.port,
- headers={"X-SoMe-hEader": "foobar"})
- with urllib.request.urlopen(req):
- pass
- self.assertIn("X-Some-Header", handler.headers_received.keys())
- self.assertNotIn("X-SoMe-hEader", handler.headers_received.keys())
- def test_basic(self):
- handler = self.start_server()
- with urllib.request.urlopen("http://localhost:%s" % handler.port) as open_url:
- for attr in ("read", "close", "info", "geturl"):
- self.assertTrue(hasattr(open_url, attr), "object returned from "
- "urlopen lacks the %s attribute" % attr)
- self.assertTrue(open_url.read(), "calling 'read' failed")
- def test_info(self):
- handler = self.start_server()
- open_url = urllib.request.urlopen(
- "http://localhost:%s" % handler.port)
- with open_url:
- info_obj = open_url.info()
- self.assertIsInstance(info_obj, email.message.Message,
- "object returned by 'info' is not an "
- "instance of email.message.Message")
- self.assertEqual(info_obj.get_content_subtype(), "plain")
- def test_geturl(self):
- # Make sure same URL as opened is returned by geturl.
- handler = self.start_server()
- open_url = urllib.request.urlopen("http://localhost:%s" % handler.port)
- with open_url:
- url = open_url.geturl()
- self.assertEqual(url, "http://localhost:%s" % handler.port)
- def test_iteration(self):
- expected_response = b"pycon 2008..."
- handler = self.start_server([(200, [], expected_response)])
- data = urllib.request.urlopen("http://localhost:%s" % handler.port)
- for line in data:
- self.assertEqual(line, expected_response)
- def test_line_iteration(self):
- lines = [b"We\n", b"got\n", b"here\n", b"verylong " * 8192 + b"\n"]
- expected_response = b"".join(lines)
- handler = self.start_server([(200, [], expected_response)])
- data = urllib.request.urlopen("http://localhost:%s" % handler.port)
- for index, line in enumerate(data):
- self.assertEqual(line, lines[index],
- "Fetched line number %s doesn't match expected:\n"
- " Expected length was %s, got %s" %
- (index, len(lines[index]), len(line)))
- self.assertEqual(index + 1, len(lines))
- def test_issue16464(self):
- # See https://bugs.python.org/issue16464
- # and https://bugs.python.org/issue46648
- handler = self.start_server([
- (200, [], b'any'),
- (200, [], b'any'),
- ])
- opener = urllib.request.build_opener()
- request = urllib.request.Request("http://localhost:%s" % handler.port)
- self.assertEqual(None, request.data)
- opener.open(request, "1".encode("us-ascii"))
- self.assertEqual(b"1", request.data)
- self.assertEqual("1", request.get_header("Content-length"))
- opener.open(request, "1234567890".encode("us-ascii"))
- self.assertEqual(b"1234567890", request.data)
- self.assertEqual("10", request.get_header("Content-length"))
- def setUpModule():
- thread_info = threading_helper.threading_setup()
- unittest.addModuleCleanup(threading_helper.threading_cleanup, *thread_info)
- if __name__ == "__main__":
- unittest.main()
|