from scrapy import Selector  # parsel's Selector offers the same API


def b():
    # Parse the locally saved Douban book list page.
    with open('../../book.html', mode='r', encoding='utf-8') as f:
        body = f.read()
    # print(body)
    ul = Selector(text=body).xpath("//*[@id='subject_list']/ul/li")
    for li in ul.getall():
        sel = Selector(text=li)
        book_name = sel.xpath("//div[@class='info']//a/@title").get()
        print(book_name)
        spider_url = sel.xpath("//div[@class='info']//a/@href").get()
        print(spider_url)
        # The pub line looks like "author / ... / press / publish_time / price".
        pub = sel.xpath("//div[@class='pub']//text()").get().replace("\n", "").strip()
        pubs = pub.split('/')
        price = pubs[-1].strip()
        publish_time = pubs[-2].strip()
        press = pubs[-3].strip()
        # Everything before the last three fields belongs to the author(s).
        authors = pubs[0:-3]
        author = ""
        for s in authors:
            author = author + s + '/'
        print(price)
        print(publish_time)
        print(press)
        print(author)
        book_content = sel.xpath("//div[@class='info']/p/text()").get()
        print(book_content)
def s():
    # Parse the locally saved Douban tags page.
    with open('../../tags.html', mode='r', encoding='utf-8') as f:
        body = f.read()
    # print(body)
    urls = Selector(text=body).xpath("//table[@class='tagCol']//td/a/@href")
    tags_name = Selector(text=body).xpath("//table[@class='tagCol']//td/a/text()")
    tags_count = Selector(text=body).xpath("//table[@class='tagCol']//td/b/text()")
    print(urls.getall())
    print(tags_name.getall())
    print(tags_count.getall())
    table = Selector(text=body).xpath("//table[@class='tagCol']//td")
    for s2 in table.getall():
        sel = Selector(text=s2)
        url = sel.xpath("//a/@href").get()
        name = sel.xpath("//a/text()").get()
        # The count text is wrapped in parentheses, e.g. "(1234)"; strip them.
        count = sel.xpath("//b/text()").get()[1:-1]
        print(url + "-" + name + "-" + count)
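

# A minimal entry point for exercising the two parsers above, assuming the
# saved pages really sit at ../../book.html and ../../tags.html as the
# relative paths in b() and s() suggest; adjust the paths if your layout differs.
if __name__ == '__main__':
    b()
    s()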