Python Request.from_curl 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: scrapy

클래스/타입: Request

메소드/함수: from_curl

hotexamples.com에서의 예제들: 5

Python Request.from_curl 예제 5개를 찾았습니다. 오픈소스 프로젝트에서 추출한 scrapy.Request.from_curl의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

Request(30)

dont_filter(8)

from_curl(5)

cookies(4)

info(4)

item(4)

errback(3)

css(2)

__init__(1)

callback(1)

copy(1)

doubanId(1)

예제 #1

파일 보기

파일: mpbio.py 프로젝트: preetijangra15/scrapybot

 def parse_products(self, response):
     """Yield a request for the Algolia ``queries`` endpoint.

     ``Request.from_curl`` expects the cURL command string as its first
     argument; calling it with only ``url=...`` raises ``TypeError`` before
     any request is built.  The endpoint URL assembled below is therefore
     wrapped in a minimal cURL command.

     NOTE(review): the original call passed ``self.url`` and left the URL
     built in this method unused.  This assumes the locally built URL is the
     intended target -- confirm against the rest of the spider.

     Args:
         response: The response that triggered this callback (not read here).

     Yields:
         The request built from the cURL command, with ``self.parse`` as its
         callback.
     """
     url = (
         "https://hwo0nunfkk-dsn.algolia.net/1/indexes/*/queries?x-algolia-agent=Algolia%20for%20"
         "JavaScript%20(3.35.1)%3B%20Browser%3B%20instantsearch.js%20(4.15.0)%3B%20Magento2%20integ"
         "ration%20(3.1.0)%3B%20JS%20Helper%20(3.4.4)&"
         "x-algolia-application-id=HWO0NUNFKK&x-algolia-api-key=MjEwNzc3YjI4Yjk5OWY1"
         "NTY4NzI3NjY0MjUyZjVmNWI1YzZjMWNkOWIzNDA0NDc2YTZlYzY4NDEyMmViMzk1N3RhZ0ZpbHRlcnM9"
     )
     # Single quotes keep the whole URL (it contains "*", "(", ")" and "&")
     # as one argument when the command string is tokenised.
     yield Request.from_curl("curl '" + url + "'", callback=self.parse)

예제 #2

파일 보기

파일: audiobook_spider.py 프로젝트: ty263-1/webcrawling

 def start_requests(self):
     """Yield the initial request, built from a captured cURL command.

     The command targets ``h5_jsonp.asp`` on img.tingchina.com and carries the
     headers and cookie string embedded in the literal below.  The response
     is handed to ``self.parse_key_string``.
     """
     # Backslash-newline inside the literal joins the physical lines; the
     # leading whitespace of each continuation line is part of the string.
     curl_command = "curl 'https://img.tingchina.com/play/h5_jsonp.asp?0.11683375963617659' \
                   -H 'Connection: keep-alive' \
                   -H 'User-Agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/88.0.4324.96 Safari/537.36' \
                   -H 'Accept: */*' \
                   -H 'Sec-Fetch-Site: same-site' \
                   -H 'Sec-Fetch-Mode: no-cors' \
                   -H 'Sec-Fetch-Dest: script' \
                   -H 'Referer: https://www.tingchina.com/yousheng/31046/play_31046_0.htm' \
                   -H 'Accept-Language: en-US,en;q=0.9' \
                   -H 'Cookie: UM_distinctid=177461d45ea7fc-09f21ff66496a9-1e2a1f04-25a3ac-177461d45eb6a8; ting_0_31046_1=0; ting_0_31046_2=490.593481; tingNewJieshaoren=0; ASPSESSIONIDSGTTAATQ=OKMJNKKBJGNBGGHLGNPFKAHM; tingNewIP%2D0%2D31046=over; tNew_play_url=https%3A//www.tingchina.com/yousheng/31046/play_31046_0.htm; ting_0_31046_0=430.00254; cscpvrich2729_p=1' \
                   --compressed"
     yield Request.from_curl(curl_command, callback=self.parse_key_string)

예제 #3

파일 보기

    def start_requests(self):
        """Record the crawl's creation time and yield one request per page.

        Sets ``self.url`` to the paginated crates.io listing template, resets
        ``self.results`` with a creation timestamp and an empty ``"crates"``
        list, then yields a request for pages ``1`` to ``self.total_page``.

        The timestamp comes from one ``time.time_ns()`` reading rather than
        two separate ``date`` subprocess calls.  One reading keeps the seconds
        and nanoseconds consistent with each other, and avoids relying on an
        external ``date`` binary that supports ``+%N``.

        Yields:
            One request per page, each with ``self.parse`` as its callback.
        """
        import time  # local import so this method does not depend on file-level imports

        self.url = 'https://crates.io/api/v1/?category=no-std&page={page}&per_page={per_page}&sort=downloads'
        #self.url = 'https://crates.io/api/v1/crates/bencher/reverse_dependencies?page={page}&per_page={per_page}'
        #self.url = 'https://crates.io/api/v1/crates?page={page}&per_page={per_page}&sort=downloads'

        def write_time():
            """Store the current time and an empty crate list in ``self.results``."""
            # Split one clock reading into whole seconds and the nanosecond
            # remainder (0 <= nanos < 1_000_000_000).
            secs, nanos = divmod(time.time_ns(), 1_000_000_000)
            self.results["creation_date"] = {
                "secs_since_epoch": secs,
                "nanos_since_epoch": nanos,
            }
            self.results["crates"] = []

        write_time()
        for page in range(self.total_page):
            # Pages in the URL are 1-based, while ``range`` counts from 0.
            yield Request.from_curl(
                "curl " + self.url.format(page=page+1, per_page=self.per_page),
                callback=self.parse)

예제 #4

파일 보기

파일: elsalvador.py 프로젝트: rongfang323/policy-data-analyzer

 def start_requests(self):
     """Yield one search request per (date range, keyword) combination.

     For every item returned by ``self.create_date_range(1990)`` and every
     entry in ``self.keywords``, a cURL command for the ``result.php`` search
     endpoint is filled in and converted into a request whose callback is
     ``self.parse``.

     The keyword is form-encoded before it is inserted.  The body is sent as
     ``application/x-www-form-urlencoded`` inside a single-quoted cURL
     argument, so a raw ``&``, ``=``, ``#`` or ``'`` in a keyword would
     corrupt the form body or break parsing of the command.

     NOTE(review): this assumes ``self.keywords`` holds plain, not already
     percent-encoded text -- confirm against the spider's configuration.
     The session cookie in the command is hard-coded and may expire.

     Yields:
         The request built for each date range / keyword pair.
     """
     from urllib.parse import quote_plus  # local import keeps the block self-contained

     for date in self.create_date_range(1990):
         for keyword in self.keywords:
             # Encode spaces, quotes and form delimiters in the free-text term.
             encoded_keyword = quote_plus(str(keyword))
             request = f"curl 'https://www.jurisprudencia.gob.sv/busqueda/result.php' -H 'Connection: keep-alive' -H 'Accept: */*' -H 'X-Requested-With: XMLHttpRequest' -H 'User-Agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.193 Safari/537.36' -H 'Content-Type: application/x-www-form-urlencoded; charset=UTF-8' -H 'Origin: https://www.jurisprudencia.gob.sv' -H 'Sec-Fetch-Site: same-origin' -H 'Sec-Fetch-Mode: cors' -H 'Sec-Fetch-Dest: empty' -H 'Referer: https://www.jurisprudencia.gob.sv/busqueda/busquedaLeg.php?id=2' -H 'Accept-Language: ca,en;q=0.9' -H 'Cookie: _ga=GA1.3.499250194.1605023569; _gid=GA1.3.1562076103.1605176978; wplc_chat_status=5; _icl_current_language=es; nc_status=browsing; PHPSESSID=emkambpjvphadn3r7lracuqvg6' --data-raw 'libre=true&txtBusquedaLibre={encoded_keyword}&baseDatos=2&nivel1=0&nivel2=0&nivel3=0&nivel4=0&maximo=300&inicio={date[0]}&fin={date[1]}&tipoBusquedaFrasePalabra=1' --compressed"
             yield Request.from_curl(request, callback=self.parse)

예제 #5

파일 보기

파일: scraper.py 프로젝트: nataliepopescu/bencher_scrape

 def start_requests(self):
     """Yield one request per result page, numbered from 1.

     ``self.url`` is used as a template with ``page`` and ``per_page``
     placeholders.  Each formatted URL is prefixed with ``"curl "`` and
     turned into a request whose callback is ``self.parse``.
     """
     template = self.url
     for page_number in range(1, self.total_page + 1):
         target = template.format(page=page_number, per_page=self.per_page)
         curl_command = "curl " + target
         yield Request.from_curl(curl_command, callback=self.parse)