Пример #1
0
def getWeb(url, isFeed):
    """Download ``url`` and parse the response body.

    Args:
        url: Address to fetch; handed unchanged to the opener's ``open``.
        isFeed: When true the response is parsed with ``etree.parse``;
            otherwise it is parsed with ``html.parse``.

    Returns:
        Whatever ``etree.parse`` or ``html.parse`` returns for the response.

    Exceptions raised while opening the URL or while parsing are not
    caught here and propagate to the caller.
    """
    # NOTE: this sets the default timeout for every socket created
    # afterwards in the process, not only for this request.
    socket.setdefaulttimeout(300)
    loadedWeb = urllib2.build_opener()
    loadedWeb.addheaders = getHeaders()
    parse = etree.parse if isFeed else html.parse
    response = loadedWeb.open(url)
    try:
        return parse(response)
    finally:
        # Always release the connection, including when parsing fails.
        response.close()
Пример #2
0
def getWeb(url, isFeed):
    """Download ``url`` and parse it with lxml.

    Args:
        url: Address to fetch; handed unchanged to the opener's ``open``.
        isFeed: When true the response is parsed with ``etree.parse``;
            otherwise it is parsed with ``html.parse``.

    Returns:
        The result of ``etree.parse`` when ``isFeed`` is true, else the
        result of ``html.parse``.

    Exceptions raised while opening the URL or while parsing are not
    caught here and propagate to the caller.
    """
    # NOTE: this sets the default timeout for every socket created
    # afterwards in the process, not only for this request.
    socket.setdefaulttimeout(300)
    loadedWeb = urllib2.build_opener()
    loadedWeb.addheaders = getHeaders()
    parse = etree.parse if isFeed else html.parse
    response = loadedWeb.open(url)
    try:
        return parse(response)
    finally:
        # Always release the connection, including when parsing fails.
        response.close()