2003-03-30 00:54:24 -04:00
|
|
|
#!/usr/bin/env python
|
|
|
|
|
|
|
|
import unittest
|
|
|
|
from test import test_support
|
|
|
|
|
|
|
|
import socket
|
2003-05-13 23:18:31 -03:00
|
|
|
import urllib
|
2003-03-30 00:54:24 -04:00
|
|
|
import sys
|
2003-05-13 23:18:31 -03:00
|
|
|
import os
|
|
|
|
import mimetools
|
2003-03-30 00:54:24 -04:00
|
|
|
|
2008-01-26 01:54:48 -04:00
|
|
|
|
|
|
|
def _open_with_retry(func, host, *args, **kwargs):
|
|
|
|
# Connecting to remote hosts is flaky. Make it more robust
|
|
|
|
# by retrying the connection several times.
|
|
|
|
for i in range(3):
|
|
|
|
try:
|
|
|
|
return func(host, *args, **kwargs)
|
|
|
|
except IOError, last_exc:
|
|
|
|
continue
|
|
|
|
except:
|
|
|
|
raise
|
|
|
|
raise last_exc
|
|
|
|
|
|
|
|
|
2003-03-30 00:54:24 -04:00
|
|
|
class URLTimeoutTest(unittest.TestCase):
    """Read a remote page through urllib with a default socket timeout set."""

    # Value passed to socket.setdefaulttimeout() for the duration of a test.
    TIMEOUT = 10.0

    def setUp(self):
        # Remember the current default so tearDown can put it back instead
        # of clobbering a timeout configured by the test runner.
        self._saved_timeout = socket.getdefaulttimeout()
        socket.setdefaulttimeout(self.TIMEOUT)

    def tearDown(self):
        socket.setdefaulttimeout(self._saved_timeout)

    def testURLread(self):
        # Opening and reading must complete without raising.
        f = _open_with_retry(urllib.urlopen, "http://www.python.org/")
        try:
            f.read()
        finally:
            f.close()
|
|
|
|
|
2003-05-13 23:18:31 -03:00
|
|
|
class urlopenNetworkTests(unittest.TestCase):
    """Tests urllib.urlopen using the network.

    These tests are not exhaustive.  Assuming that testing using files does a
    good job overall of some of the basic interface features.  There are no
    tests exercising the optional 'data' and 'proxies' arguments.  No tests
    for transparent redirection have been written.

    setUp is not used for always constructing a connection to
    http://www.python.org/ since there are a few tests that don't use that
    address and making a connection is expensive enough to warrant minimizing
    unneeded connections.

    """

    def urlopen(self, *args):
        """Call urllib.urlopen(*args) through the module's retry helper."""
        return _open_with_retry(urllib.urlopen, *args)

    def test_basic(self):
        # Simple test expected to pass.
        open_url = self.urlopen("http://www.python.org/")
        try:
            # Checked inside the try block so that a failed assertion
            # still closes the connection.
            for attr in ("read", "readline", "readlines", "fileno", "close",
                         "info", "geturl"):
                self.assertTrue(hasattr(open_url, attr),
                                "object returned from "
                                "urlopen lacks the %s attribute" % attr)
            self.assertTrue(open_url.read(), "calling 'read' failed")
        finally:
            open_url.close()

    def test_readlines(self):
        # Test both readline and readlines.
        open_url = self.urlopen("http://www.python.org/")
        try:
            self.assertTrue(isinstance(open_url.readline(), basestring),
                            "readline did not return a string")
            self.assertTrue(isinstance(open_url.readlines(), list),
                            "readlines did not return a list")
        finally:
            open_url.close()

    def test_info(self):
        # Test 'info'.
        open_url = self.urlopen("http://www.python.org/")
        try:
            info_obj = open_url.info()
        finally:
            open_url.close()
        self.assertTrue(isinstance(info_obj, mimetools.Message),
                        "object returned by 'info' is not an instance of "
                        "mimetools.Message")
        self.assertEqual(info_obj.getsubtype(), "html")

    def test_geturl(self):
        # Make sure same URL as opened is returned by geturl.
        URL = "http://www.python.org/"
        open_url = self.urlopen(URL)
        try:
            gotten_url = open_url.geturl()
        finally:
            open_url.close()
        self.assertEqual(gotten_url, URL)

    def test_getcode(self):
        # test getcode() with the fancy opener to get 404 error codes
        URL = "http://www.python.org/XXXinvalidXXX"
        # Go through the retry helper like the other tests in this class.
        open_url = _open_with_retry(urllib.FancyURLopener().open, URL)
        try:
            code = open_url.getcode()
        finally:
            open_url.close()
        self.assertEqual(code, 404)

    def test_fileno(self):
        if (sys.platform in ('win32',) or
                not hasattr(os, 'fdopen')):
            # On Windows, socket handles are not file descriptors; this
            # test can't pass on Windows.
            return
        # Make sure fd returned by fileno is valid.
        open_url = self.urlopen("http://www.python.org/")
        fd = open_url.fileno()
        FILE = os.fdopen(fd)
        try:
            self.assertTrue(FILE.read(), "reading from file created using fd "
                                         "returned by fileno failed")
        finally:
            FILE.close()

    def test_bad_address(self):
        # Make sure proper exception is raised when connecting to a bogus
        # address.
        #
        # SF patch 809915: In Sep 2003, VeriSign started highjacking invalid
        # .com and .net addresses to boost traffic to their own site.  This
        # test (which then used "http://www.sadflkjsasadf.com/") started
        # failing.  One hopes the .invalid domain will be spared to serve
        # its defined purpose.
        self.assertRaises(IOError,
                          urllib.urlopen, "http://www.python.invalid./")
|
2003-05-13 23:18:31 -03:00
|
|
|
|
|
|
|
class urlretrieveNetworkTests(unittest.TestCase):
    """Tests urllib.urlretrieve using the network."""

    def urlretrieve(self, *args):
        """Call urllib.urlretrieve(*args) through the module's retry helper."""
        return _open_with_retry(urllib.urlretrieve, *args)

    def test_basic(self):
        # Test basic functionality.
        file_location, info = self.urlretrieve("http://www.python.org/")
        try:
            self.assertTrue(os.path.exists(file_location),
                            "file location returned by"
                            " urlretrieve is not a valid path")
            with open(file_location) as FILE:
                self.assertTrue(FILE.read(),
                                "reading from the file location returned"
                                " by urlretrieve failed")
        finally:
            # Remove the download even when an assertion above failed.
            test_support.unlink(file_location)

    def test_specified_path(self):
        # Make sure that specifying the location of the file to write to works.
        try:
            file_location, info = self.urlretrieve("http://www.python.org/",
                                                   test_support.TESTFN)
            self.assertEqual(file_location, test_support.TESTFN)
            self.assertTrue(os.path.exists(file_location))
            with open(file_location) as FILE:
                self.assertTrue(FILE.read(),
                                "reading from temporary file failed")
        finally:
            # Covers a failed or partial retrieve as well as failed
            # assertions, so the target path never outlives the test.
            test_support.unlink(test_support.TESTFN)

    def test_header(self):
        # Make sure header returned as 2nd value from urlretrieve is good.
        file_location, header = self.urlretrieve("http://www.python.org/")
        # Only the header is inspected; the downloaded file is not needed.
        os.unlink(file_location)
        self.assertTrue(isinstance(header, mimetools.Message),
                        "header is not an instance of mimetools.Message")
|
2003-05-16 12:35:10 -03:00
|
|
|
|
2003-05-13 23:18:31 -03:00
|
|
|
|
|
|
|
|
2003-03-30 00:54:24 -04:00
|
|
|
def test_main():
    """Run every test case class in this module.

    Calls test_support.requires('network') first, then runs the suites with
    the urllib.urlopen DeprecationWarning filtered out.
    """
    test_support.requires('network')
    from warnings import filterwarnings
    with test_support.catch_warning(record=False):
        # Raw string so the regex escape ``\.`` is not treated as a string
        # escape; the pattern itself is unchanged.
        filterwarnings('ignore', r'.*urllib\.urlopen.*Python 3.0',
                       DeprecationWarning)
        # Run inside the ``with`` block so the filter is still installed
        # while the tests execute.
        test_support.run_unittest(URLTimeoutTest,
                                  urlopenNetworkTests,
                                  urlretrieveNetworkTests)
|
2003-03-30 00:54:24 -04:00
|
|
|
|
|
|
|
# Run the tests when this file is executed directly rather than imported.
if __name__ == "__main__":
    test_main()
|