Ejemplos de PyQuery.closest en Python

Lenguaje de programación: Python

Namespace/Package Name: pyquery

Clase / Tipo: PyQuery

Método / Función: closest

Ejemplos en hotexamples.com: 4

Python PyQuery.closest - 4 ejemplos encontrados. Estos son los ejemplos en Python del mundo real mejor valorados de pyquery.PyQuery.closest, extraídos de proyectos de código abierto. Puedes valorar los ejemplos para ayudarnos a mejorar su calidad.

Métodos usados con frecuencia

Mostrar Ocultar

PyQuery(30)

remove(30)

eq(30)

outerHtml(30)

attr(30)

children(30)

items(30)

html(29)

make_links_absolute(24)

split(24)

find(19)

replace(17)

__unicode__(14)

outer_html(13)

contents(12)

append(12)

size(10)

strip(9)

is_(8)

replaceWith(8)

startswith(6)

has_class(5)

encode(5)

index(4)

parents(4)

lower(4)

get(4)

next(3)

remove_namespaces(3)

hasClass(2)

parent(2)

each(2)

decode(2)

__html__(2)

closest(2)

clone(2)

add_class(2)

addClass(2)

map(2)

endswith(2)

show(1)

replace_with(1)

serialize(1)

siblings(1)

start(1)

terminate(1)

removeClass(1)

insertBefore(1)

removeAttr(1)

read(1)

Ejemplo n.º 1

Mostrar archivo

Archivo: scrape.py Proyecto: JMassapina/rewindhn

def parse(html):
    """Return a list of dictionaries describing the stories on the front page.

    ``html`` is the page markup handed to ``PyQuery``. Each title anchor
    matched by the selector below produces one dictionary with the keys
    ``pos``, ``title``, ``url``, ``domain``, ``comments``, ``submitter``,
    ``points``, ``id`` and ``ago``.

    Anchors whose following row has no ``.subtext`` element (the "More"
    link) and rows whose subtext has fewer than two children (ads) are
    skipped. ``pos`` is the 1-based position among the stories kept.
    """
    elements = []
    p = PyQuery(html)
    # 90s markup woohoo!
    anchors = p('.title:nth-child(3) a:nth-child(1)')
    for a in anchors:
        # Re-wrap: iterating a PyQuery object yields the underlying lxml
        # elements, not PyQuery objects.
        a = PyQuery(a)
        subtext = a.closest('tr').next().find('.subtext')
        if not subtext:
            # "More" link
            continue
        # Build a real list. On Python 3 ``map`` returns an iterator, which
        # cannot be indexed, so ``map(PyQuery, ...)`` followed by
        # ``children[0]`` raised TypeError instead of the IndexError that
        # is handled below.
        children = [PyQuery(child) for child in subtext.children()]
        try:
            span, submitted, comments = children[0], children[1], children[-1]
        except IndexError:
            # filter out ads
            continue
        # Keep the text before the last space; an empty result counts as
        # zero comments.
        comments = comments.text().rpartition(' ')[0]
        comments = int(comments) if comments else 0
        url = a.attr('href')
        elements.append({
            'pos': len(elements) + 1,
            'title': a.text(),
            'url': url,
            # Host name with everything up to and including 'www.' removed.
            'domain': urlparse(url).netloc.rpartition('www.')[2],
            'comments': comments,
            'submitter': submitted.text(),
            'points': int(span.text().split()[0]),
            'id': int(span.attr('id').split('_', 1)[1]),
            # Text trailing the submitter element, up to the word 'ago'.
            'ago': submitted[0].tail.split('ago')[0].strip(),
        })
    logging.warning('parsed %s elements', len(elements))
    return elements

Ejemplo n.º 2

Mostrar archivo

    def get_subforums_infos(self, html):
        """
        Get information (description, number of topics and posts, ...) about
        the forums listed on a page.

        For every ``a.forumlink`` anchor in ``html`` whose cleaned ``href``
        fully matches ``/<id>-...`` (``<id>`` being ``f`` or ``c`` followed
        by digits), the entry ``self.forums[<id>]`` gets its ``status``,
        ``description``, ``num_topics`` and ``num_posts`` attributes set from
        the table row containing the anchor. Anchors that do not match are
        skipped.
        """
        document = PyQuery(html)

        idpattern = re.compile(r"/([fc]\d+)-.*")

        for element in document("a.forumlink"):
            # Iterating a PyQuery object yields raw elements; wrap again.
            e = PyQuery(element)

            match = idpattern.fullmatch(clean_url(e.attr("href")))
            if not match:
                continue

            oldid = match.group(1)

            row = e.closest("tr")

            # Get forum status
            # ``attr`` returns None when the first cell has no image or the
            # image has no ``alt``; fall back to an empty string so the
            # substring test below does not raise TypeError.
            alt = row("td:nth-of-type(1) img").eq(0).attr("alt") or ""
            # "verrouillé" is French for "locked".
            self.forums[oldid].status = 1 if "verrouillé" in alt else 0

            # Get subforum description
            self.forums[oldid].description = row("td:nth-of-type(2) span").eq(
                1).html() or ""

            # TODO : Get subforum icon

            # Get subforum numbers of topics and posts
            self.forums[oldid].num_topics = int(row("td").eq(2).text())
            self.forums[oldid].num_posts = int(row("td").eq(3).text())

Ejemplo n.º 3

Mostrar archivo

Archivo: scrape.py Proyecto: 99plus2/rewindhn

def parse(html):
    """Return a list of dictionaries describing the stories on the front page.

    The markup in ``html`` is loaded with ``PyQuery``; every title anchor
    selected below contributes one dictionary holding ``pos``, ``title``,
    ``url``, ``domain``, ``comments``, ``submitter``, ``points``, ``id``
    and ``ago``.

    An anchor is skipped when the row after its ``tr`` has no ``.subtext``
    element (the "More" link) or when that subtext has fewer than two
    children (ads). ``pos`` counts the stories kept, starting at 1.
    """
    elements = []
    p = PyQuery(html)
    # 90s markup woohoo!
    anchors = p('.title:nth-child(3) a:nth-child(1)')
    for a in anchors:
        # have to re-wrap here, because PyQuery just exposes internal lxml
        # objects upon getting iterated
        a = PyQuery(a)
        subtext = a.closest('tr').next().find('.subtext')
        if not subtext:
            # More link
            continue
        # ``map`` is a non-indexable iterator on Python 3, so indexing its
        # result raised TypeError (not caught below). A list comprehension
        # gives an indexable list on every Python version.
        children = [PyQuery(node) for node in subtext.children()]
        try:
            span, submitted, comments = children[0], children[1], children[-1]
        except IndexError:
            # filter out ads
            continue
        # Text before the last space; empty means no comment count.
        comments = comments.text().rpartition(' ')[0]
        comments = int(comments) if comments else 0
        url = a.attr('href')
        elements.append({
            'pos': len(elements) + 1,
            'title': a.text(),
            'url': url,
            # Network location with any leading '...www.' part dropped.
            'domain': urlparse(url).netloc.rpartition('www.')[2],
            'comments': comments,
            'submitter': submitted.text(),
            'points': int(span.text().split()[0]),
            'id': int(span.attr('id').split('_', 1)[1]),
            # Tail text after the submitter element, cut at 'ago'.
            'ago': submitted[0].tail.split('ago')[0].strip(),
        })
    logging.warning('parsed %s elements', len(elements))
    return elements

Ejemplo n.º 4

Mostrar archivo

Archivo: forums.py Proyecto: Roromis/Lalf-Forumactif

    def get_subforums_infos(self, html):
        """
        Get information (description, number of topics and posts, ...) about
        the forums listed on a page.

        Each ``a.forumlink`` anchor found in ``html`` is matched against
        ``/<id>-...`` after its ``href`` has gone through ``clean_url``;
        ``<id>`` is ``f`` or ``c`` followed by digits. For matching anchors,
        ``self.forums[<id>]`` receives ``status``, ``description``,
        ``num_topics`` and ``num_posts`` read from the enclosing table row.
        Non-matching anchors are ignored.
        """
        document = PyQuery(html)

        idpattern = re.compile(r"/([fc]\d+)-.*")

        for element in document("a.forumlink"):
            # Wrap the raw element produced by iteration.
            e = PyQuery(element)

            match = idpattern.fullmatch(clean_url(e.attr("href")))
            if not match:
                continue

            oldid = match.group(1)

            row = e.closest("tr")

            # Get forum status
            # A missing image or missing ``alt`` makes ``attr`` return None,
            # and ``"..." in None`` raises TypeError; default to "".
            alt = row("td:nth-of-type(1) img").eq(0).attr("alt") or ""
            # "verrouillé" is French for "locked".
            self.forums[oldid].status = 1 if "verrouillé" in alt else 0

            # Get subforum description
            self.forums[oldid].description = row("td:nth-of-type(2) span").eq(1).html() or ""

            # TODO : Get subforum icon

            # Get subforum numbers of topics and posts
            self.forums[oldid].num_topics = int(row("td").eq(2).text())
            self.forums[oldid].num_posts = int(row("td").eq(3).text())