Ejemplo n.º 1
0
    def __init__(self, **kwargs):
        """Initialize the spider from keyword arguments and load its config.

        Args:
            **kwargs: Forwarded unchanged to the parent initializer. The
                "name" and "redis_key" entries are also stored on the
                instance (None when an entry is absent).
        """
        super(BaiduSearchBySiteKeywordSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # XPath settings are read from baidu.json -> "baidu" -> "search_conf".
        baidu_conf = confUtil.getJsonStr("baidu.json").get("baidu")
        self.xpathConf = baidu_conf.get("search_conf")
        self.Wait_Element = self.xpathConf.get("wait_element")
Ejemplo n.º 2
0
    def __init__(self, **kwargs):
        """Initialize the spider from keyword arguments and load its config.

        Args:
            **kwargs: Forwarded unchanged to the parent initializer. The
                "name" and "redis_key" entries are also stored on the
                instance (None when an entry is absent).
        """
        super(SougouWeixinFilterSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # XPath settings are read from
        # sougou.json -> "sougou" -> "sougou_weixin".
        sougou_conf = confUtil.getJsonStr("sougou.json").get("sougou")
        self.xpathConf = sougou_conf.get("sougou_weixin")
        self.Wait_Element = self.xpathConf.get("wait_element")
Ejemplo n.º 3
0
    def __init__(self, **kwargs):
        """Initialize the spider from keyword arguments and load its config.

        Args:
            **kwargs: Forwarded unchanged to the parent initializer. The
                "name" and "redis_key" entries are also stored on the
                instance (None when an entry is absent).
        """
        super(BaiduSinaNewsFilterSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # XPath settings are read from baidu.json -> "baidu" -> "sina_news".
        baidu_conf = confUtil.getJsonStr("baidu.json").get("baidu")
        self.xpathConf = baidu_conf.get("sina_news")
        self.Wait_Element = self.xpathConf.get("wait_element")
Ejemplo n.º 4
0
    def __init__(self, **kwargs):
        """Initialize the spider from keyword arguments and load its config.

        Args:
            **kwargs: Forwarded unchanged to the parent initializer. The
                "name" and "redis_key" entries are also stored on the
                instance (None when an entry is absent).
        """
        super(WeiboSearchStartSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # XPath settings are read from weibo.json -> "weibo_com", keyed by
        # self.spider_type. That attribute is not assigned in this method;
        # presumably the class or its parent provides it -- verify.
        weibo_com_conf = confUtil.getJsonStr("weibo.json").get("weibo_com")
        self.xpathConf = weibo_com_conf.get(self.spider_type)
        self.Wait_Element = self.xpathConf.get("wait_element")
Ejemplo n.º 5
0
    def __init__(self, **kwargs):
        """Build the spider and cache the Sougou/Weixin page configuration.

        Args:
            **kwargs: Passed through to the parent initializer as-is; the
                values under "name" and "redis_key" (or None if missing)
                are additionally kept on the instance.
        """
        super(SougouWeixinFilterSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # Config path: sougou.json -> "sougou" -> "sougou_weixin".
        site_section = confUtil.getJsonStr("sougou.json").get("sougou")
        self.xpathConf = site_section.get("sougou_weixin")
        self.Wait_Element = self.xpathConf.get("wait_element")
    def __init__(self, **kwargs):
        """Build the spider and cache the weibo.com page configuration.

        Args:
            **kwargs: Passed through to the parent initializer as-is; the
                values under "name" and "redis_key" (or None if missing)
                are additionally kept on the instance.
        """
        super(WeiboSearchStartSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # Config path: weibo.json -> "weibo_com" -> <self.spider_type>.
        # self.spider_type is not set here; presumably it is supplied by
        # the class or its parent -- verify.
        site_section = confUtil.getJsonStr("weibo.json").get("weibo_com")
        self.xpathConf = site_section.get(self.spider_type)
        self.Wait_Element = self.xpathConf.get("wait_element")
    def __init__(self, **kwargs):
        """Build the spider and cache the Baidu/Sina-news page configuration.

        Args:
            **kwargs: Passed through to the parent initializer as-is; the
                values under "name" and "redis_key" (or None if missing)
                are additionally kept on the instance.
        """
        super(BaiduSinaNewsFilterSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # Config path: baidu.json -> "baidu" -> "sina_news".
        site_section = confUtil.getJsonStr("baidu.json").get("baidu")
        self.xpathConf = site_section.get("sina_news")
        self.Wait_Element = self.xpathConf.get("wait_element")
    def __init__(self, **kwargs):
        """Build the spider and cache the Baidu search page configuration.

        Args:
            **kwargs: Passed through to the parent initializer as-is; the
                values under "name" and "redis_key" (or None if missing)
                are additionally kept on the instance.
        """
        super(BaiduSearchBySiteKeywordSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # Config path: baidu.json -> "baidu" -> "search_conf".
        site_section = confUtil.getJsonStr("baidu.json").get("baidu")
        self.xpathConf = site_section.get("search_conf")
        self.Wait_Element = self.xpathConf.get("wait_element")
Ejemplo n.º 9
0
    def __init__(self, **kwargs):
        """Initialize the spider from keyword arguments and load its config.

        Args:
            **kwargs: Forwarded unchanged to the parent initializer. The
                "name" and "redis_key" entries are also stored on the
                instance (None when an entry is absent).
        """
        super(WeixinContentSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # XPath settings are read from weixin.json, keyed first by
        # self.siteName and then by self.spider_type. Neither attribute is
        # assigned in this method; presumably the class or its parent
        # provides them -- verify.
        weixin_doc = confUtil.getJsonStr("weixin.json")
        site_conf = weixin_doc.get(self.siteName)
        self.xpathConf = site_conf.get(self.spider_type)
        self.Wait_Element = self.xpathConf.get("wait_element")

        # Add "title" to itemKeys (a collection defined outside this method).
        self.itemKeys.append("title")
Ejemplo n.º 10
0
    def __init__(self, **kwargs):
        """Initialize the spider from keyword arguments and load its config.

        Args:
            **kwargs: Forwarded unchanged to the parent initializer. The
                "name" and "redis_key" entries are also stored on the
                instance. "name" must contain a ":" because the output key
                is derived from the text before it.

        Raises:
            ValueError: If the name contains no ":" (raised by str.index).
        """
        super(WeiboComUserInfoContentSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")
        # Output key: the portion of the name before the first ":". Per the
        # original comment this is the Redis key crawl results are written to.
        colon_at = self.name.index(":")
        self.out_key = self.name[:colon_at]

        # XPath settings are read from weibo.json -> "weibo_cn" -> "user_info".
        weibo_cn_conf = confUtil.getJsonStr("weibo.json").get("weibo_cn")
        self.xpathConf = weibo_cn_conf.get("user_info")
        self.Wait_Element = self.xpathConf.get("wait_element")
Ejemplo n.º 11
0
    def __init__(self, **kwargs):
        """Build the spider and cache the Weixin page configuration.

        Args:
            **kwargs: Passed through to the parent initializer as-is; the
                values under "name" and "redis_key" (or None if missing)
                are additionally kept on the instance.
        """
        super(WeixinContentSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # Config path: weixin.json -> <self.siteName> -> <self.spider_type>.
        # Both attributes are set outside this method; presumably by the
        # class or its parent -- verify.
        all_sites = confUtil.getJsonStr("weixin.json")
        site_section = all_sites.get(self.siteName)
        self.xpathConf = site_section.get(self.spider_type)
        self.Wait_Element = self.xpathConf.get("wait_element")

        # itemKeys is defined outside this method; "title" is added to it.
        self.itemKeys.append("title")
    def __init__(self, **kwargs):
        """Build the spider and cache the weibo.cn user-info configuration.

        Args:
            **kwargs: Passed through to the parent initializer as-is; the
                values under "name" and "redis_key" are additionally kept
                on the instance. "name" has to include a ":" since the
                output key is the text preceding it.

        Raises:
            ValueError: If the name has no ":" (raised by str.index).
        """
        super(WeiboComUserInfoContentSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")
        # Output key = name prefix before the first ":". The original
        # comment describes it as the Redis key that receives crawl results.
        prefix_end = self.name.index(":")
        self.out_key = self.name[:prefix_end]

        # Config path: weibo.json -> "weibo_cn" -> "user_info".
        site_section = confUtil.getJsonStr("weibo.json").get("weibo_cn")
        self.xpathConf = site_section.get("user_info")
        self.Wait_Element = self.xpathConf.get("wait_element")
Ejemplo n.º 13
0
    def __init__(self, **kwargs):
        """Initialize the spider from keyword arguments and load its config.

        Args:
            **kwargs: Forwarded unchanged to the parent initializer. The
                "name" and "redis_key" entries are also stored on the
                instance (None when an entry is absent).
        """
        super(WeiboComSearchSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # XPath settings are read from
        # weibo.json -> "weibo_com" -> "search_conf".
        weibo_com_conf = confUtil.getJsonStr("weibo.json").get("weibo_com")
        self.xpathConf = weibo_com_conf.get("search_conf")
        self.Wait_Element = self.xpathConf.get("wait_element")

        # Append the extra keys to itemKeys (defined outside this method),
        # one at a time and in this order.
        for extra_key in ('attitude', 'comments', 'repost', 'user_url'):
            self.itemKeys.append(extra_key)
    def __init__(self, **kwargs):
        """Build the spider and cache the weibo.com search configuration.

        Args:
            **kwargs: Passed through to the parent initializer as-is; the
                values under "name" and "redis_key" (or None if missing)
                are additionally kept on the instance.
        """
        super(WeiboComSearchSpider, self).__init__(**kwargs)
        self.name = kwargs.get("name")
        self.redis_key = kwargs.get("redis_key")

        # Config path: weibo.json -> "weibo_com" -> "search_conf".
        site_section = confUtil.getJsonStr("weibo.json").get("weibo_com")
        self.xpathConf = site_section.get("search_conf")
        self.Wait_Element = self.xpathConf.get("wait_element")

        # itemKeys is defined outside this method; the keys below are
        # appended to it in the listed order.
        additional_keys = ('attitude', 'comments', 'repost', 'user_url')
        for item_key in additional_keys:
            self.itemKeys.append(item_key)