| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148 |
- #!/usr/bin/python
- ####
- # 02/2006 Will Holcomb <wholcomb@gmail.com>
- #
- # This library is free software; you can redistribute it and/or
- # modify it under the terms of the GNU Lesser General Public
- # License as published by the Free Software Foundation; either
- # version 2.1 of the License, or (at your option) any later version.
- #
- # This library is distributed in the hope that it will be useful,
- # but WITHOUT ANY WARRANTY; without even the implied warranty of
- # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- # Lesser General Public License for more details.
- #
- # 7/26/07 Slightly modified by Brian Schneider
- # in order to support unicode files ( multipart_encode function )
- #
- # 10/17/07 Dirk: inherit from urllib2.HTTPHandler instead of BaseHandler to support wsgi_intercept
- """
- Usage:
- Enables the use of multipart/form-data for posting forms
- Inspirations:
- Upload files in python:
- http://aspn.activestate.com/ASPN/Cookbook/Python/Recipe/146306
- urllib2_file:
- Fabien Seisen: <fabien@seisen.org>
- Example:
- import MultipartPostHandler, urllib2, cookielib
- cookies = cookielib.CookieJar()
- opener = urllib2.build_opener(urllib2.HTTPCookieProcessor(cookies),
- MultipartPostHandler.MultipartPostHandler)
- params = { "username" : "bob", "password" : "riviera",
- "file" : open("filename", "rb") }
- opener.open("http://www.bobsite.com/upload/", params)
- Further Example:
- The main function of this file is a sample which downloads a page and
- then uploads it to the W3C validator.
- """
- import urllib
- import urllib2
- import mimetools, mimetypes
- import os, stat
- from cStringIO import StringIO
- #~ from wsgi_intercept import WSGI_HTTPConnection
class Callable:
    """Thin wrapper that forwards calls to the wrapped callable.

    An instance is not a function, so when one is stored as a class
    attribute it is not turned into a bound method on attribute access;
    calling it passes the arguments straight through to the wrapped object.
    """

    def __init__(self, anycallable):
        # Keep the target under a private name; ``__call__`` below delegates.
        self._anycallable = anycallable

    def __call__(self, *args, **kwargs):
        # Defined on the class (rather than assigned on the instance) because
        # new-style classes look special methods up on the type, so an
        # instance-level ``__call__`` attribute would not make the object
        # callable there.
        return self._anycallable(*args, **kwargs)
# Controls how sequences are encoded. If true, elements may be given multiple
# values by assigning a sequence. Passed as the ``doseq`` argument of
# urllib.urlencode when a request carries no file objects.
doseq = 1
- class MultipartPostHandler(urllib2.HTTPHandler):
- handler_order = urllib2.HTTPHandler.handler_order - 10 # needs to run first
- def http_request(self, request):
- data = request.get_data()
- if data is not None and type(data) != str:
- v_files = []
- v_vars = []
- try:
- for(key, value) in data.items():
- if type(value) == file:
- v_files.append((key, value))
- else:
- v_vars.append((key, value))
- except TypeError:
- tb = sys.exc_info()[2]
- try:
- raise TypeError, "not a valid non-string sequence or mapping object", tb
- finally:
- tb = None
- if len(v_files) == 0:
- data = urllib.urlencode(v_vars, doseq)
- else:
- boundary, data = self.multipart_encode(v_vars, v_files)
- contenttype = 'multipart/form-data; boundary=%s' % boundary
- if(request.has_header('Content-Type')
- and request.get_header('Content-Type').find('multipart/form-data') != 0):
- print "Replacing %s with %s" % (request.get_header('content-type'), 'multipart/form-data')
- request.add_unredirected_header('Content-Type', contenttype)
- request.add_data(data)
- return request
- #~ def http_open(self, req):
- #~ return self.do_open(WSGI_HTTPConnection, req)
- def multipart_encode(vars, files, boundary=None, buf=None):
- if boundary is None:
- boundary = mimetools.choose_boundary()
- if buf is None:
- buf = StringIO()
- for(key, value) in vars:
- buf.write('--%s\r\n' % boundary)
- buf.write('Content-Disposition: form-data; name="%s"' % key)
- buf.write('\r\n\r\n' + value + '\r\n')
- for(key, fd) in files:
- file_size = os.fstat(fd.fileno())[stat.ST_SIZE]
- filename = fd.name.split('/')[-1]
- contenttype = mimetypes.guess_type(filename)[0] or 'application/octet-stream'
- buf.write('--%s\r\n' % boundary)
- buf.write('Content-Disposition: form-data; name="%s"; filename="%s"\r\n' % (key, filename))
- buf.write('Content-Type: %s\r\n' % contenttype)
- # buffer += 'Content-Length: %s\r\n' % file_size
- fd.seek(0)
- buf.write('\r\n' + fd.read() + '\r\n')
- buf.write('--' + boundary + '--\r\n\r\n')
- buf = buf.getvalue()
- return boundary, buf
- multipart_encode = Callable(multipart_encode)
- https_request = http_request
def main():  # pragma: no cover
    """Sample: download each URL and upload it to the W3C validator.

    URLs are taken from the command line; with no arguments,
    http://www.google.com is used. The validator's response is printed.
    """
    import sys
    import tempfile

    validatorURL = "http://validator.w3.org/check"
    opener = urllib2.build_opener(MultipartPostHandler)

    def validateFile(url):
        """Fetch *url* into a temp file, post that file, print the reply."""
        fd, path = tempfile.mkstemp(suffix=".html")
        try:
            try:
                os.write(fd, opener.open(url).read())
            finally:
                # mkstemp hands back an open descriptor the caller must close.
                os.close(fd)
            upload = open(path, "rb")
            try:
                params = {"ss": "0",  # show source
                          "doctype": "Inline",
                          "uploaded_file": upload}
                print(opener.open(validatorURL, params).read())
            finally:
                upload.close()
        finally:
            # Remove the temp file even if the download or upload failed.
            os.remove(path)

    urls = sys.argv[1:] or ["http://www.google.com"]
    for url in urls:
        validateFile(url)


if __name__ == "__main__":  # pragma: no cover
    main()
|