106 lines
		
	
	
		
			3.2 KiB
		
	
	
	
		
			Python
		
	
	
			
		
		
	
	
			106 lines
		
	
	
		
			3.2 KiB
		
	
	
	
		
			Python
		
	
	
| from cStringIO import StringIO
 | |
| 
 | |
| import _response
 | |
| import _urllib2_fork
 | |
| 
 | |
| 
 | |
| # GzipConsumer was taken from Fredrik Lundh's effbot.org-0.1-20041009 library
 | |
class GzipConsumer:
    """Incremental gzip decoder that forwards decompressed data to a consumer.

    The wrapped ``consumer`` must provide ``feed(data)`` and ``close()``.
    Byte strings passed to :meth:`feed` are buffered until a complete gzip
    header has been seen; everything after the header is inflated as a raw
    deflate stream and handed to ``consumer.feed``.  Attributes not defined
    here are looked up on the wrapped consumer.
    """

    def __init__(self, consumer):
        self.__consumer = consumer
        # zlib decompression object; created once the gzip header is parsed.
        self.__decoder = None
        # Input buffered while the gzip header is still incomplete.
        self.__data = b""

    def __getattr__(self, key):
        # Only reached when normal lookup fails.  Refuse our own mangled
        # private names so that a missing ``__consumer`` (e.g. an instance
        # created without running __init__) raises AttributeError instead
        # of recursing forever.
        if key.startswith("_GzipConsumer__"):
            raise AttributeError(key)
        return getattr(self.__consumer, key)

    def __header_end(self, data):
        """Return the offset just past the gzip header, or None if incomplete.

        Raises IOError("invalid gzip data") as soon as the bytes seen so far
        cannot be the start of a deflate-compressed gzip stream.
        """
        magic = b"\x1f\x8b\x08"
        seen = data[:3]
        # Validate the magic/method bytes eagerly: non-gzip input must not be
        # buffered indefinitely while waiting for a header that never comes.
        if seen != magic[:len(seen)]:
            raise IOError("invalid gzip data")
        if len(data) < 10:
            return None  # fixed-size part of the header not complete yet
        # One-byte slices keep ord() working whether indexing the byte
        # string yields characters or integers.
        flags = ord(data[3:4])
        pos = 10
        if flags & 4:  # extra field: 2-byte little-endian length + payload
            if len(data) < pos + 2:
                return None
            pos += 2 + ord(data[pos:pos + 1]) + 256 * ord(data[pos + 1:pos + 2])
        for bit in (8, 16):  # NUL-terminated filename, then comment
            if flags & bit:
                nul = data.find(b"\0", pos)
                if nul < 0:
                    return None
                pos = nul + 1
        if flags & 2:  # header crc
            pos += 2
        if len(data) < pos:
            return None
        return pos

    def feed(self, data):
        """Accept the next chunk of gzip data.

        Decompressed output, if any, is passed to the consumer's ``feed``.
        Raises IOError if the input does not start with a gzip header.
        """
        if self.__decoder is None:
            # check if we have a full gzip header
            data = self.__data + data
            body_start = self.__header_end(data)
            if body_start is None:
                self.__data = data
                return  # need more data
            import zlib
            self.__data = b""
            # Negative wbits selects a raw deflate stream: the gzip header
            # has already been stripped by hand above.
            self.__decoder = zlib.decompressobj(-zlib.MAX_WBITS)
            data = data[body_start:]
        data = self.__decoder.decompress(data)
        if data:
            self.__consumer.feed(data)

    def close(self):
        """Flush any pending decompressed data and close the consumer."""
        if self.__decoder is not None:
            data = self.__decoder.flush()
            if data:
                self.__consumer.feed(data)
        self.__consumer.close()
 | |
| 
 | |
| 
 | |
| # --------------------------------------------------------------------
 | |
| 
 | |
| # the rest of this module is John Lee's stupid code, not
 | |
| # Fredrik's nice code :-)
 | |
| 
 | |
class stupid_gzip_consumer:
    """Minimal consumer that collects every chunk it is fed in ``self.data``."""

    def __init__(self):
        # Chunks in the order they were fed.
        self.data = []

    def feed(self, data):
        """Append one chunk to ``self.data``."""
        self.data.append(data)

    def close(self):
        """Do nothing; present so that closing the feeding decoder works."""
        pass
 | |
| 
 | |
class stupid_gzip_wrapper(_response.closeable_response):
    """Response wrapper that serves the gzip-decoded body of another response.

    The wrapped response is read in full at construction time and pushed
    through a GzipConsumer; the decoded result is kept in an in-memory
    StringIO that backs read(), readline() and readlines().  Any other
    attribute is fetched from the wrapped response.
    """

    def __init__(self, response):
        self._response = response

        # Collect everything the decoder emits, then expose it as a file.
        sink = stupid_gzip_consumer()
        decoder = GzipConsumer(sink)
        compressed = response.read()
        decoder.feed(compressed)
        decoded = "".join(sink.data)
        self.__data = StringIO(decoded)

    def read(self, size=-1):
        """Read from the decoded body (same arguments as StringIO.read)."""
        body = self.__data
        return body.read(size)

    def readline(self, size=-1):
        """Read one line from the decoded body."""
        body = self.__data
        return body.readline(size)

    def readlines(self, sizehint=-1):
        """Read the remaining lines of the decoded body."""
        body = self.__data
        return body.readlines(sizehint)

    def __getattr__(self, name):
        # Anything not defined on this wrapper is delegated to the
        # wrapped response object.
        wrapped = self._response
        return getattr(wrapped, name)
 | |
| 
 | |
class HTTPGzipProcessor(_urllib2_fork.BaseHandler):
    """Handler that asks for gzip-encoded responses and decodes them.

    Outgoing HTTP requests get an ``Accept-Encoding: gzip`` header; HTTP and
    HTTPS responses whose Content-Encoding names gzip are replaced by a
    stupid_gzip_wrapper around the original response.
    """

    handler_order = 200  # response processing before HTTPEquivProcessor

    def http_request(self, request):
        """Advertise gzip support on the request and return it."""
        request.add_header("Accept-Encoding", "gzip")
        return request

    def http_response(self, request, response):
        """Return a gzip-decoding wrapper for gzip responses, else ``response``."""
        # post-process response
        for enc_hdr in response.info().getheaders("Content-encoding"):
            # Content codings are case-insensitive, comma-separated tokens.
            codings = [token.strip().lower() for token in enc_hdr.split(",")]
            # Only gzip (and its alias x-gzip) can be handled by the gzip
            # decoder; "compress" is a different (LZW) coding and is left
            # untouched rather than being fed to a decoder that cannot
            # read it.
            if "gzip" in codings or "x-gzip" in codings:
                return stupid_gzip_wrapper(response)
        return response

    https_response = http_response
 |