import logging
import traceback
from gzip import GzipFile
from StringIO import StringIO  # Python 2 stdlib; this code also relies on the `unicode` type


def read_sitemaps(sitemaps, max_urls=10000):
    """
    Read one or more sitemaps and return all URLs found.

    sitemaps: a list of sitemap URLs (consumed in place; nested sitemap
              index entries are appended to it by _read_sitemap)
    max_urls: stop processing more sitemaps once max_urls are already found
    """
    urls = set()

    while len(sitemaps) > 0:
        url = sitemaps.pop(0)
        webpage = _fetch_url(url)

        if len(webpage) == 0:
            continue

        # Not every server returns a correct Content-Encoding header, so sniff
        # for the sitemaps XML namespace in the first 1 KB and, failing that,
        # try to decompress the body as gzip before giving up on it.
        if "sitemaps" not in webpage[:1000]:
            try:
                webpage = GzipFile(fileobj=StringIO(webpage)).read()
                if "sitemaps" not in webpage[:1000]:
                    continue
            except Exception:
                logging.debug(traceback.format_exc())
                continue

        # read sitemap
        logging.debug("Reading sitemap: " + url)
        if isinstance(webpage, unicode):
            webpage = webpage.encode("utf-8")

        _read_sitemap(webpage, urls, sitemaps)
        logging.debug("URLs so far: %s" % len(urls))

        if len(urls) > max_urls:
            break

    return list(urls)[:max_urls]
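
# A minimal usage sketch, assuming _fetch_url and _read_sitemap are defined
# elsewhere in this module; the sitemap URL is made up for illustration.
# read_sitemaps consumes the list it is given (sitemaps.pop(0)), so pass a
# copy if the caller still needs the original list.
if __name__ == "__main__":
    logging.basicConfig(level=logging.DEBUG)
    found = read_sitemaps(["http://example.com/sitemap.xml"], max_urls=500)
    print("Found %d URLs" % len(found))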
# Method of a urllib2 handler subclassing urllib2.HTTPCookieProcessor.
# Module-level imports assumed: re, urllib2, GzipFile, StringIO; log(),
# detect_encoding() and the MIMETYPE table are helpers defined elsewhere.
def http_response(self, req, resp):
    urllib2.HTTPCookieProcessor.http_response(self, req, resp)
    data = resp.read()

    if 200 <= resp.code < 300:
        # gzip: decompress the body ourselves if the server flagged it
        if resp.headers.get('Content-Encoding') == 'gzip':
            log('un-gzip')
            data = GzipFile(fileobj=StringIO(data), mode='r').read()

    if 200 <= resp.code < 300 and resp.info().maintype == 'text':
        # <meta> redirect: follow client-side "refresh" redirects in HTML
        if resp.info().type in MIMETYPE['html']:
            match = re.search(r'(?i)<meta http-equiv=.refresh[^>]*?url=(http.*?)["\']', data)
            if match:
                new_url = match.groups()[0]
                log('redirect: %s' % new_url)

                # drop body-specific headers before re-issuing the request
                new_headers = dict((k, v) for k, v in req.headers.items()
                                   if k.lower() not in ('content-length', 'content-type'))

                new = urllib2.Request(new_url,
                                      headers=new_headers,
                                      origin_req_host=req.get_origin_req_host(),
                                      unverifiable=True)
                return self.parent.open(new, timeout=req.timeout)

        # encoding: decode to unicode, then re-encode unless self.decode is set
        enc = detect_encoding(data, resp)

        if enc:
            data = data.decode(enc, 'replace')

            if not self.decode:
                data = data.encode(enc)

    # rebuild the response around the (possibly transformed) body, since the
    # original file object has already been consumed by resp.read()
    fp = StringIO(data)
    old_resp = resp
    resp = urllib2.addinfourl(fp, old_resp.headers, old_resp.url, old_resp.code)
    resp.msg = old_resp.msg

    return resp
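
# A standalone check of the <meta http-equiv="refresh"> regex used above;
# the snippet and URL are made up for illustration, not taken from real pages.
import re

snippet = '<meta http-equiv="refresh" content="0; url=http://example.com/next">'
match = re.search(r'(?i)<meta http-equiv=.refresh[^>]*?url=(http.*?)["\']', snippet)
if match:
    print(match.groups()[0])  # -> http://example.com/next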