Vega Strike Python Modules doc: URLopener Class Reference

def addheader	(	self,
		*args
	)

Add a header to be used by the HTTP interface only
e.g. u.addheader('Accept', 'sound/basic')

Definition at line 143 of file urllib.py.

 
     def addheader(self, *args):
         """Add a header to be used by the HTTP interface only
         e.g. u.addheader('Accept', 'sound/basic')"""
         self.addheaders.append(args)

def cleanup ( self)

Definition at line 129 of file urllib.py.

References URLopener.__tempfiles, URLopener.__unlink, and URLopener.tempcache.

 
     def cleanup(self):
         # This code sometimes runs when the rest of this module
         # has already been deleted, so it can't use any globals
         # or import anything.
         if self.__tempfiles:
             for file in self.__tempfiles:
                 try:
                     self.__unlink(file)
                 except OSError:
                     pass
             del self.__tempfiles[:]
         if self.tempcache:
             self.tempcache.clear()

def close ( self)

Definition at line 126 of file urllib.py.

References URLopener.cleanup().

 
     def close(self):
         self.cleanup()

def http_error	(	self,
		url,
		fp,
		errcode,
		errmsg,
		headers,
		data = `None`
	)

Handle http errors.
Derived class can override this, or provide specific handlers
named http_error_DDD where DDD is the 3-digit error code.

Definition at line 305 of file urllib.py.

References URLopener.http_error_default().

 
     def http_error(self, url, fp, errcode, errmsg, headers, data=None):
         """Handle http errors.
         Derived class can override this, or provide specific handlers
         named http_error_DDD where DDD is the 3-digit error code."""
         # First check if there's a specific handler for this error
         name = 'http_error_%d' % errcode
         if hasattr(self, name):
             method = getattr(self, name)
             if data is None:
                 result = method(url, fp, errcode, errmsg, headers)
             else:
                 result = method(url, fp, errcode, errmsg, headers, data)
             if result: return result
         return self.http_error_default(url, fp, errcode, errmsg, headers)

def http_error_default	(	self,
		url,
		fp,
		errcode,
		errmsg,
		headers
	)

Default error handler: close the connection and raise IOError.

Definition at line 320 of file urllib.py.

 
     def http_error_default(self, url, fp, errcode, errmsg, headers):
         """Default error handler: close the connection and raise IOError."""
         void = fp.read()
         fp.close()
         raise IOError, ('http error', errcode, errmsg, headers)

def open	(	self,
		fullurl,
		data = `None`
	)

Use URLopener().open(file) instead of open(file, 'r').

Definition at line 149 of file urllib.py.

References URLopener.proxies, urllib.splithost(), urllib.splittype(), URLopener.tempcache, urllib.toBytes(), and urllib.unwrap().

 
     def open(self, fullurl, data=None):
         """Use URLopener().open(file) instead of open(file, 'r')."""
         fullurl = unwrap(toBytes(fullurl))
         if self.tempcache and self.tempcache.has_key(fullurl):
             filename, headers = self.tempcache[fullurl]
             fp = open(filename, 'rb')
             return addinfourl(fp, headers, fullurl)
         urltype, url = splittype(fullurl)
         if not urltype:
             urltype = 'file'
         if self.proxies.has_key(urltype):
             proxy = self.proxies[urltype]
             urltype, proxyhost = splittype(proxy)
             host, selector = splithost(proxyhost)
             url = (host, fullurl) # Signal special case to open_*()
         else:
             proxy = None
         name = 'open_' + urltype
         self.type = urltype
         if '-' in name:
             # replace - with _
             name = '_'.join(name.split('-'))
         if not hasattr(self, name):
             if proxy:
                 return self.open_unknown_proxy(proxy, fullurl, data)
             else:
                 return self.open_unknown(fullurl, data)
         try:
             if data is None:
                 return getattr(self, name)(url)
             else:
                 return getattr(self, name)(url, data)
         except socket.error, msg:
             raise IOError, ('socket error', msg), sys.exc_info()[2]

def open_data	(	self,
		url,
		data = `None`
	)

Use "data" URL.

Definition at line 491 of file urllib.py.

References base64.decodestring(), dospath.join(), and urllib.unquote().

 
     def open_data(self, url, data=None):
         """Use "data" URL."""
         # ignore POSTed data
         #
         # syntax of data URLs:
         # dataurl   := "data:" [ mediatype ] [ ";base64" ] "," data
         # mediatype := [ type "/" subtype ] *( ";" parameter )
         # data      := *urlchar
         # parameter := attribute "=" value
         import StringIO, mimetools, time
         try:
             [type, data] = url.split(',', 1)
         except ValueError:
             raise IOError, ('data error', 'bad data URL')
         if not type:
             type = 'text/plain;charset=US-ASCII'
         semi = type.rfind(';')
         if semi >= 0 and '=' not in type[semi:]:
             encoding = type[semi+1:]
             type = type[:semi]
         else:
             encoding = ''
         msg = []
         msg.append('Date: %s'%time.strftime('%a, %d %b %Y %T GMT',
                                             time.gmtime(time.time())))
         msg.append('Content-type: %s' % type)
         if encoding == 'base64':
             import base64
             data = base64.decodestring(data)
         else:
             data = unquote(data)
         msg.append('Content-length: %d' % len(data))
         msg.append('')
         msg.append(data)
         msg = '\n'.join(msg)
         f = StringIO.StringIO(msg)
         headers = mimetools.Message(f, 0)
         f.fileno = None     # needed for addinfourl
         return addinfourl(f, headers, url)
 

def open_file	(	self,
		url
	)

Use local file or FTP depending on form of URL.

Definition at line 400 of file urllib.py.

References URLopener.open_ftp(), and URLopener.open_local_file().

 
     def open_file(self, url):
         """Use local file or FTP depending on form of URL."""
         if url[:2] == '//' and url[2:3] != '/':
             return self.open_ftp(url)
         else:
             return self.open_local_file(url)

def open_ftp	(	self,
		url
	)

Use FTP protocol.

Definition at line 435 of file urllib.py.

References URLopener.ftpcache, urllib.ftperrors(), mimetypes.guess_type(), dospath.join(), urllib.splitattr(), urllib.splithost(), urllib.splitpasswd(), urllib.splitport(), urllib.splituser(), urllib.splitvalue(), and urllib.unquote().

 
     def open_ftp(self, url):
         """Use FTP protocol."""
         import mimetypes, mimetools, StringIO
         host, path = splithost(url)
         if not host: raise IOError, ('ftp error', 'no host given')
         host, port = splitport(host)
         user, host = splituser(host)
         if user: user, passwd = splitpasswd(user)
         else: passwd = None
         host = unquote(host)
         user = unquote(user or '')
         passwd = unquote(passwd or '')
         host = socket.gethostbyname(host)
         if not port:
             import ftplib
             port = ftplib.FTP_PORT
         else:
             port = int(port)
         path, attrs = splitattr(path)
         path = unquote(path)
         dirs = path.split('/')
         dirs, file = dirs[:-1], dirs[-1]
         if dirs and not dirs[0]: dirs = dirs[1:]
         if dirs and not dirs[0]: dirs[0] = '/'
         key = user, host, port, '/'.join(dirs)
         # XXX thread unsafe!
         if len(self.ftpcache) > MAXFTPCACHE:
             # Prune the cache, rather arbitrarily
             for k in self.ftpcache.keys():
                 if k != key:
                     v = self.ftpcache[k]
                     del self.ftpcache[k]
                     v.close()
         try:
             if not self.ftpcache.has_key(key):
                 self.ftpcache[key] = \
                     ftpwrapper(user, passwd, host, port, dirs)
             if not file: type = 'D'
             else: type = 'I'
             for attr in attrs:
                 attr, value = splitvalue(attr)
                 if attr.lower() == 'type' and \
                    value in ('a', 'A', 'i', 'I', 'd', 'D'):
                     type = value.upper()
             (fp, retrlen) = self.ftpcache[key].retrfile(file, type)
             mtype = mimetypes.guess_type("ftp:" + url)[0]
             headers = ""
             if mtype:
                 headers += "Content-Type: %s\n" % mtype
             if retrlen is not None and retrlen >= 0:
                 headers += "Content-Length: %d\n" % retrlen
             headers = mimetools.Message(StringIO.StringIO(headers))
             return addinfourl(fp, headers, "ftp:" + url)
         except ftperrors(), msg:
             raise IOError, ('ftp error', msg), sys.exc_info()[2]

def open_gopher	(	self,
		url
	)

Use Gopher protocol.

Definition at line 384 of file urllib.py.

References urllib.noheaders(), gopherlib.send_query(), gopherlib.send_selector(), urllib.splitgophertype(), urllib.splithost(), urllib.splitquery(), and urllib.unquote().

 
     def open_gopher(self, url):
         """Use Gopher protocol."""
         import gopherlib
         host, selector = splithost(url)
         if not host: raise IOError, ('gopher error', 'no host given')
         host = unquote(host)
         type, selector = splitgophertype(selector)
         selector, query = splitquery(selector)
         selector = unquote(selector)
         if query:
             query = unquote(query)
             fp = gopherlib.send_query(selector, query, host)
         else:
             fp = gopherlib.send_selector(selector, host)
         return addinfourl(fp, noheaders(), "gopher:" + url)

def open_http	(	self,
		url,
		data = `None`
	)

Use HTTP protocol.

Definition at line 249 of file urllib.py.

References URLopener.addheaders, base64.encodestring(), URLopener.http_error(), urllib.proxy_bypass(), urllib.splithost(), urllib.splittype(), urllib.splituser(), string.strip(), URLopener.type, and urllib.unquote().

 
     def open_http(self, url, data=None):
         """Use HTTP protocol."""
         import httplib
         user_passwd = None
         if type(url) is types.StringType:
             host, selector = splithost(url)
             if host:
                 user_passwd, host = splituser(host)
                 host = unquote(host)
             realhost = host
         else:
             host, selector = url
             urltype, rest = splittype(selector)
             url = rest
             user_passwd = None
             if urltype.lower() != 'http':
                 realhost = None
             else:
                 realhost, rest = splithost(rest)
                 if realhost:
                     user_passwd, realhost = splituser(realhost)
                 if user_passwd:
                     selector = "%s://%s%s" % (urltype, realhost, rest)
                 if proxy_bypass(realhost):
                     host = realhost
 
             #print "proxy via http:", host, selector
         if not host: raise IOError, ('http error', 'no host given')
         if user_passwd:
             import base64
             auth = base64.encodestring(user_passwd).strip()
         else:
             auth = None
         h = httplib.HTTP(host)
         if data is not None:
             h.putrequest('POST', selector)
             h.putheader('Content-type', 'application/x-www-form-urlencoded')
             h.putheader('Content-length', '%d' % len(data))
         else:
             h.putrequest('GET', selector)
         if auth: h.putheader('Authorization', 'Basic %s' % auth)
         if realhost: h.putheader('Host', realhost)
         for args in self.addheaders: apply(h.putheader, args)
         h.endheaders()
         if data is not None:
             h.send(data)
         errcode, errmsg, headers = h.getreply()
         fp = h.getfile()
         if errcode == 200:
             return addinfourl(fp, headers, "http:" + url)
         else:
             if data is None:
                 return self.http_error(url, fp, errcode, errmsg, headers)
             else:
                 return self.http_error(url, fp, errcode, errmsg, headers, data)

def open_https	(	self,
		url,
		data = `None`
	)

Use HTTPS protocol.

Definition at line 327 of file urllib.py.

References URLopener.addheaders, URLopener.cert_file, HTTPSConnection.cert_file, HTTPS.cert_file, base64.encodestring(), URLopener.http_error(), URLopener.key_file, HTTPSConnection.key_file, HTTPS.key_file, urllib.splithost(), urllib.splittype(), urllib.splituser(), string.strip(), URLopener.type, and urllib.unquote().

 
         def open_https(self, url, data=None):
             """Use HTTPS protocol."""
             import httplib
             user_passwd = None
             if type(url) is types.StringType:
                 host, selector = splithost(url)
                 if host:
                     user_passwd, host = splituser(host)
                     host = unquote(host)
                 realhost = host
             else:
                 host, selector = url
                 urltype, rest = splittype(selector)
                 url = rest
                 user_passwd = None
                 if urltype.lower() != 'https':
                     realhost = None
                 else:
                     realhost, rest = splithost(rest)
                     if realhost:
                         user_passwd, realhost = splituser(realhost)
                     if user_passwd:
                         selector = "%s://%s%s" % (urltype, realhost, rest)
                 #print "proxy via https:", host, selector
             if not host: raise IOError, ('https error', 'no host given')
             if user_passwd:
                 import base64
                 auth = base64.encodestring(user_passwd).strip()
             else:
                 auth = None
             h = httplib.HTTPS(host, 0,
                               key_file=self.key_file,
                               cert_file=self.cert_file)
             if data is not None:
                 h.putrequest('POST', selector)
                 h.putheader('Content-type',
                             'application/x-www-form-urlencoded')
                 h.putheader('Content-length', '%d' % len(data))
             else:
                 h.putrequest('GET', selector)
             if auth: h.putheader('Authorization: Basic %s' % auth)
             if realhost: h.putheader('Host', realhost)
             for args in self.addheaders: apply(h.putheader, args)
             h.endheaders()
             if data is not None:
                 h.send(data)
             errcode, errmsg, headers = h.getreply()
             fp = h.getfile()
             if errcode == 200:
                 return addinfourl(fp, headers, "https:" + url)
             else:
                 if data is None:
                     return self.http_error(url, fp, errcode, errmsg, headers)
                 else:
                     return self.http_error(url, fp, errcode, errmsg, headers,
                                            data)

def open_local_file	(	self,
		url
	)

Use local file.

Definition at line 407 of file urllib.py.

References rfc822.formatdate(), mimetypes.guess_type(), urllib.localhost(), URLopener.open(), urllib.splithost(), urllib.splitport(), urllib.thishost(), and urllib.url2pathname().

 
     def open_local_file(self, url):
         """Use local file."""
         import mimetypes, mimetools, rfc822, StringIO
         host, file = splithost(url)
         localname = url2pathname(file)
         stats = os.stat(localname)
         size = stats[stat.ST_SIZE]
         modified = rfc822.formatdate(stats[stat.ST_MTIME])
         mtype = mimetypes.guess_type(url)[0]
         headers = mimetools.Message(StringIO.StringIO(
             'Content-Type: %s\nContent-Length: %d\nLast-modified: %s\n' %
             (mtype or 'text/plain', size, modified)))
         if not host:
             urlfile = file
             if file[:1] == '/':
                 urlfile = 'file://' + file
             return addinfourl(open(localname, 'rb'),
                               headers, urlfile)
         host, port = splitport(host)
         if not port \
            and socket.gethostbyname(host) in (localhost(), thishost()):
             urlfile = file
             if file[:1] == '/':
                 urlfile = 'file://' + file
             return addinfourl(open(localname, 'rb'),
                               headers, urlfile)
         raise IOError, ('local file error', 'not on local host')

def open_unknown	(	self,
		fullurl,
		data = `None`
	)

Overridable interface to open unknown URL type.

Definition at line 184 of file urllib.py.

References urllib.splittype().

 
     def open_unknown(self, fullurl, data=None):
         """Overridable interface to open unknown URL type."""
         type, url = splittype(fullurl)
         raise IOError, ('url error', 'unknown url type', type)

def open_unknown_proxy	(	self,
		proxy,
		fullurl,
		data = `None`
	)

Overridable interface to open a URL through a proxy whose scheme has no handler.

Definition at line 189 of file urllib.py.

References urllib.splittype().

 
     def open_unknown_proxy(self, proxy, fullurl, data=None):
         """Overridable interface to open unknown URL type."""
         type, url = splittype(fullurl)
         raise IOError, ('url error', 'invalid proxy for %s' % type, proxy)

def retrieve	(	self,
		url,
		filename = `None`,
		reporthook = `None`,
		data = `None`
	)

retrieve(url) returns (filename, headers) for a local object
or (tempfilename, headers) for a remote object.

Definition at line 195 of file urllib.py.

References tempfile.mktemp(), Pattern.open, _posixfile_.open(), URLopener.open(), Template.open(), Telnet.open(), URLopener.open_local_file(), urllib.reporthook(), urllib.splitattr(), urllib.splithost(), urllib.splitquery(), urllib.splittype(), URLopener.tempcache, urllib.toBytes(), urllib.unwrap(), and urllib.url2pathname().

 
     def retrieve(self, url, filename=None, reporthook=None, data=None):
         """retrieve(url) returns (filename, None) for a local object
         or (tempfilename, headers) for a remote object."""
         url = unwrap(toBytes(url))
         if self.tempcache and self.tempcache.has_key(url):
             return self.tempcache[url]
         type, url1 = splittype(url)
         if not filename and (not type or type == 'file'):
             try:
                 fp = self.open_local_file(url1)
                 hdrs = fp.info()
                 del fp
                 return url2pathname(splithost(url1)[1]), hdrs
             except IOError, msg:
                 pass
         fp = self.open(url, data)
         headers = fp.info()
         if not filename:
             import tempfile
             garbage, path = splittype(url)
             garbage, path = splithost(path or "")
             path, garbage = splitquery(path or "")
             path, garbage = splitattr(path or "")
             suffix = os.path.splitext(path)[1]
             filename = tempfile.mktemp(suffix)
             self.__tempfiles.append(filename)
         result = filename, headers
         if self.tempcache is not None:
             self.tempcache[url] = result
         tfp = open(filename, 'wb')
         bs = 1024*8
         size = -1
         blocknum = 1
         if reporthook:
             if headers.has_key("content-length"):
                 size = int(headers["Content-Length"])
             reporthook(0, bs, size)
         block = fp.read(bs)
         if reporthook:
             reporthook(1, bs, size)
         while block:
             tfp.write(block)
             block = fp.read(bs)
             blocknum = blocknum + 1
             if reporthook:
                 reporthook(blocknum, bs, size)
         fp.close()
         tfp.close()
         del fp
         del tfp
         return result

addheaders

Definition at line 107 of file urllib.py.

cert_file

Definition at line 106 of file urllib.py.

ftpcache

Definition at line 117 of file urllib.py.

key_file

Definition at line 105 of file urllib.py.

proxies

Definition at line 104 of file urllib.py.

tempcache

Definition at line 110 of file urllib.py.

type

Definition at line 167 of file urllib.py.

string version = "Python-urllib/%s"

static

Definition at line 97 of file urllib.py.

def __init__	(	self,
		proxies = `None`,
		**x509
	)

Public Member Functions

Data Fields

Static Public Attributes

Detailed Description

Constructor & Destructor Documentation

Member Function Documentation

Field Documentation

Public Member Functions
def	__init__

def	__del__

def	close

def	cleanup

def	addheader

def	open

def	open_unknown

def	open_unknown_proxy

def	retrieve

def	open_http

def	http_error

def	http_error_default

def	open_https

def	open_gopher

def	open_file

def	open_local_file

def	open_ftp

def	open_data