Пример #1
0
 def __init__(self, url, callback, method='GET', headers=None,
              need_proxy=False, fail_time=0, timeout=TIMEOUT):
     """Set up the base ``Request`` and record the extra per-request fields.

     ``method``, ``url`` and ``headers`` are handed to ``Request.__init__``
     positionally; the remaining arguments are stored unchanged as
     instance attributes of the same name.
     """
     # The base initializer is invoked explicitly rather than through
     # super(); the original author's note warns that the parent-class
     # ordering must not be mixed up.
     Request.__init__(self, method, url, headers)
     self.timeout = timeout
     self.fail_time = fail_time
     self.need_proxy = need_proxy
     self.callback = callback
Пример #2
0
 def __init__(self, url, callback, method='GET', headers=None, timeout=3, proxy=None, params=None, data=None):
     """Initialise the base ``Request`` and store the extra request options.

     ``method``, ``url`` and ``headers`` go to ``Request.__init__``;
     ``callback``, ``timeout``, ``proxy``, ``params`` and ``data`` are stored
     as instance attributes after the base initializer has run.
     """
     # An explicit (unbound) base-class call must receive the instance as its
     # first argument; without it ``url`` would be bound as ``self``.
     # NOTE(review): argument order (method, url, headers) assumes the base
     # is ``requests.Request`` -- confirm against the import.
     Request.__init__(self, method, url, headers)
     self.callback = callback
     self.timeout = timeout
     self.proxy = proxy
     # Assigned after the base call, so these values replace whatever the
     # base initializer stored under the same attribute names.
     self.params = params
     self.data = data
Пример #3
0
 def __init__(self, url, callback, method='GET', header=None,
              need_proxy=False, fail_time=0, timeout=TIMEOUT):
     """Build the underlying ``Request`` and attach the extra fields.

     The header argument is spelled ``header`` (singular) in this signature;
     it is passed as the third positional argument of ``Request.__init__``.
     All other extra arguments are stored as same-named attributes.
     """
     Request.__init__(self, method, url, header)
     self.callback, self.need_proxy = callback, need_proxy
     self.fail_time, self.timeout = fail_time, timeout
 def __init__(self, url=None, callback=None, method='GET',
         headers=None, need_proxy=False, fail_times=0, timeout=TIMEOUT):
     """Initialise the base ``Request`` and store the extra request fields.

     ``callback`` is given a ``None`` default because a parameter without a
     default may not follow one that has a default (``url=None``); the
     previous signature was a SyntaxError.

     ``method``, ``url`` and ``headers`` are passed to ``Request.__init__``;
     ``callback``, ``need_proxy``, ``fail_times`` and ``timeout`` are stored
     as instance attributes.
     """
     Request.__init__(self, method, url, headers)
     self.callback = callback
     self.need_proxy = need_proxy
     self.fail_times = fail_times
     self.timeout = timeout
Пример #5
0
 def __init__(self, url, callback, method='GET', headers=None,
              need_proxy=False, fail_time=0, timeout=5):
     """Initialise the base ``Request``, defaulting the headers.

     When ``headers`` is ``None`` the class-level ``DEFAULT_HEADERS`` object
     is used instead. The remaining arguments are stored as same-named
     instance attributes.
     """
     effective_headers = self.DEFAULT_HEADERS if headers is None else headers
     Request.__init__(self, method, url, effective_headers)
     self.timeout = timeout
     self.fail_time = fail_time
     self.need_proxy = need_proxy
     self.callback = callback
Пример #6
0
    def __init__(self: HTTPEntity, cert: Dict = None):
        """Construct the HTTPEntity base object.

        Runs ``Request.__init__`` with no arguments beyond the instance.

        Args:
            cert (Dict): certificate for authentication. It is accepted
                here but not read anywhere in this initializer.
        """
        Request.__init__(self)
Пример #7
0
 def __init__(self,
              method='GET', url=None, headers=None, files=None, data=None,
              params=None, auth=None, cookies=None, hooks=None, json=None,
              call_back=None, need_proxy=False, failtime=0, timeout=10):
     """Initialise the base ``Request`` and store the crawler-specific fields.

     The first ten parameters are forwarded by keyword to
     ``Request.__init__``. Previously only ``method``, ``url`` and
     ``headers`` were forwarded, so ``files``, ``data``, ``params``,
     ``auth``, ``cookies``, ``hooks`` and ``json`` were silently discarded.

     ``call_back``, ``need_proxy``, ``failtime`` and ``timeout`` are stored
     as instance attributes.
     """
     # NOTE(review): keyword names assume the base is ``requests.Request``,
     # whose initializer has exactly these parameters -- confirm the import.
     Request.__init__(
         self,
         method=method, url=url, headers=headers, files=files, data=data,
         params=params, auth=auth, cookies=cookies, hooks=hooks, json=json,
     )
     self.call_back = call_back
     self.need_proxy = need_proxy
     self.failtime = failtime
     self.timeout = timeout
Пример #8
0
    def __init__(self: HTTPEntity, cert: Dict=None):
        """Construct the HTTPEntity base object.

        Installs a warnings filter that ignores ``ResourceWarning`` messages
        matching "unclosed", then runs ``Request.__init__`` with no further
        arguments.

        Args:
            cert (Dict): certificate for authentication. It is accepted
                here but not read anywhere in this initializer.
        """
        warnings.filterwarnings(
            action="ignore",
            message="unclosed",
            category=ResourceWarning,
        )
        Request.__init__(self)
Пример #9
0
 def __init__(self, method='GET', callback=None, need_proxy=False,
              fail_time=0, *args, **kwargs):
     """Initialise the base ``Request`` and store the extra fields.

     ``method`` plus any additional positional and keyword arguments are
     passed straight through to ``Request.__init__``. ``callback``,
     ``need_proxy`` and ``fail_time`` are kept on the instance.
     """
     Request.__init__(self, method, *args, **kwargs)
     self.fail_time = fail_time
     self.need_proxy = need_proxy
     self.callback = callback
Пример #10
0
 def __init__(self, url, callback, method='GET', headers=None,
              need_proxy=False, fail_time=0, timeout=TIMEOUT):
     """Initialise the base ``Request`` and attach the crawl metadata.

     :param url: passed to ``Request.__init__``
     :param callback: callback function
     :param method: passed to ``Request.__init__``
     :param headers: passed to ``Request.__init__``
     :param need_proxy: whether the request should be crawled via a proxy
     :param fail_time: number of failures
     :param timeout: timeout value
     """
     Request.__init__(self, method, url, headers)
     self.callback, self.need_proxy = callback, need_proxy
     self.fail_time, self.timeout = fail_time, timeout
Пример #11
0
 def __init__(self, url, method='GET', headers=None, callback=None,
              need_proxy=None, timeout=TIMEOUT, failed_time=0):
     """Initialise the base ``Request`` and keep the extra arguments.

     ``method``, ``url`` and ``headers`` are forwarded positionally to
     ``Request.__init__``. ``callback``, ``need_proxy``, ``timeout`` and
     ``failed_time`` are stored as same-named instance attributes.
     """
     Request.__init__(self, method, url, headers)
     self.callback = callback
     self.need_proxy = need_proxy
     self.timeout = timeout
     self.failed_time = failed_time
Пример #12
0
 def __init__(self, url, callback, method='GET', headers=None,
              need_proxy=False, fail_time=0, timeout=TIMEOUT):
     """Initialise the base ``Request`` and store the extra request fields.

     ``callback``, ``need_proxy``, ``fail_time`` and ``timeout`` are kept on
     the instance under the same names.
     """
     # Note from the original author: the order of these three positional
     # arguments must not be changed (alternatively, pass them in keyword
     # form such as ``url=url``).
     Request.__init__(self, method, url, headers)
     self.timeout = timeout
     self.fail_time = fail_time
     self.need_proxy = need_proxy
     self.callback = callback
Пример #13
0
 def __init__(self,
              url,
              callback,
              method='GET',
              headers=None,
              timeout=3,
              proxy=None,
              params=None,
              data=None):
     """Initialise the base ``Request`` and store the extra request options.

     ``method``, ``url`` and ``headers`` go to ``Request.__init__``;
     ``callback``, ``timeout``, ``proxy``, ``params`` and ``data`` are stored
     as instance attributes after the base initializer has run.
     """
     # The explicit base-class call needs the instance as its first argument;
     # the previous call omitted it, so ``url`` was bound as ``self``.
     # NOTE(review): argument order (method, url, headers) assumes the base
     # is ``requests.Request`` -- confirm against the import.
     Request.__init__(self, method, url, headers)
     self.callback = callback
     self.timeout = timeout
     self.proxy = proxy
     # Assigned after the base call, so these values replace whatever the
     # base initializer stored under the same attribute names.
     self.params = params
     self.data = data
Пример #14
0
 def __init__(self, url, callback, method='GET', headers=None,
              need_proxy=False, fail_time=0, timeout=TIMEOUT):
     """Run the ``Request`` initializer, then add the extra attributes."""
     # Delegate method/url/headers to the inherited Request initializer.
     Request.__init__(self, method, url, headers)
     # Additional fields that the base initializer is not given.
     self.callback, self.need_proxy = callback, need_proxy
     self.fail_time, self.timeout = fail_time, timeout
Пример #15
0
    def __init__(self, method=None, url=None, proxy_name=None, headers=None, files=None,
                 data=None, params=None, auth=None, cookies=None, hooks=None,
                 crawler_name=None, timeout=None, json=None):
        '''This is the `Request` class in ysacrapy.

        :param method: string, http method such as "GET", "POST", etc.
            Falls back to "GET" when falsy.
        :param url: string, http request url to use.
        :param proxy_name: string, get http proxy from proxy set using this proxy_name.
        :param headers: dict, http request headers.
        :param data: string, use data if `method` is "POST".
            Stored as '' when falsy.
        :param cookies: dict, http request cookies.
        :param crawler_name: string, crawler name to use with this `Request` object.
        :param timeout: stored on the instance; falls back to 15 when falsy.

        `files`, `params`, `auth`, `hooks` and `json` are forwarded to the
        base initializer unchanged.

        Use `requests.Request` as base class to keep interface simple.
        Just use this class like `requests.Request`.

        '''

        RequestLib.__init__(
            self,
            method=method,
            url=url,
            headers=headers,
            files=files,
            data=data,
            params=params,
            auth=auth,
            cookies=cookies,
            hooks=hooks,
            json=json
        )
        # These assignments run after the base initializer and therefore
        # replace whatever it stored for `data` and `method`.
        self.data = data if data else ''
        self.crawler_name = crawler_name
        self.proxy_name = proxy_name
        self.method = method if method else 'GET'
        # Single assignment; an earlier redundant `self.timeout = timeout`
        # that was immediately overwritten has been removed.
        self.timeout = timeout if timeout else 15
Пример #16
0
    def __init__(self, url, callback, method="GET", headers=None,
                 need_proxy=False, fail_time=0, timeout=TIMEOUT):
        """Initialise the base ``Request`` and store the extra fields.

        :param url: URL of the request
        :param callback: callback function
        :param method: GET request by default
        :param headers: no request headers by default
        :param need_proxy: no proxy is used by default
        :param fail_time: number of failed retries
        :param timeout: timeout value
        """
        Request.__init__(self, method, url, headers)
        self.timeout = timeout
        self.fail_time = fail_time
        self.need_proxy = need_proxy
        self.callback = callback
Пример #17
0
    def __init__(self, url, callback, method='GET', headers=None,
                 need_proxy=NEED_PROXY, timeout=TIMEOUT, fail_time=0):
        """Initialise the base ``Request`` and store the extra fields.

        :param url: url
        :param callback: callback function
        :param method: request method
        :param headers: request headers
        :param need_proxy: whether a proxy is needed
        :param timeout: timeout value
        :param fail_time: number of times the request has failed
        """
        Request.__init__(self, method, url, headers)
        self.callback, self.need_proxy = callback, need_proxy
        self.timeout, self.fail_time = timeout, fail_time
 def __init__(self, url, callback, method='GET', headers=None,
              need_proxy=False, fail_time=0, timeout=TIMEOUT):
     """Initialise the base ``Request`` and attach the extra parameters.

     :param callback: callback function, so it is known which method should
         handle the response to this request
     :param need_proxy: whether the request should be crawled via a proxy
     :param fail_time: failure count, used to decide whether the failure
         threshold has been reached and the request should be dropped
     :param timeout: timeout value
     """
     Request.__init__(self, method, url, headers)
     self.timeout = timeout
     self.fail_time = fail_time
     self.need_proxy = need_proxy
     self.callback = callback