Example #1
0
 def __init__(self):
     """Run the SiteS2Query initializer and create empty sub-query slots."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     self.fakeoriginalurl = 'https://www.baidu.com'
     # This instance is not fully initialized yet, so passing `self` to
     # other classes here would be problematic; any class that needs `self`
     # must therefore not be constructed inside __init__.
     self.baidutieba = self.baidutieba2 = None
Example #2
0
 def __init__(self):
     """Run the SiteS2Query initializer and set the bilibili URLs and STEP_* values."""
     SiteS2Query.__init__(self)
     self.fakeoriginalurl = 'http://www.bilibili.com/'
     # Search endpoint template with {keyword} and {page} placeholders.
     search_api = 'http://search.bilibili.com/ajax_api/video?keyword={keyword}&page={page}&order=totalrank'
     self.queryUrl = search_api
     #self.pageUrl = 'http://search.bilibili.com/all?keyword={keyword}&page={page}&order=totalrank'
     self.STEP_PAGES, self.STEP_VIDEOS = None, 1
 def __init__(self, parent=None):
     """Run the SiteS2Query initializer and set the dmzj URL and regex helper.

     Args:
         parent: optional object; when truthy, its ``website`` attribute is
             copied onto this instance.
     """
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     self.fakeoriginalurl = 'https://donghua.dmzj.com/'
     self.r = RegexUtility()
     if not parent:
         return
     self.website = parent.website
 def __init__(self):
     """Run the SiteS2Query initializer and set the Sohu search settings."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     self.fakeoriginalurl = 'http://video.sohu.com/'
     search_template = 'http://so.tv.sohu.com/mts?wd={key}&flag={flag}&c={c}&length={length}&v={v}&limit={limit}&p={page}&o={o}'
     self.QUERY_TEMPLATE = search_template
     self.DEFAULT_PAGE_SIZE = 20
     # String tags stored on the instance, assigned in their original order.
     self.S2QUERY_DEFAULT, self.S2QUERY_FIRST_PAGE, self.S2QUERY_EACH_PAGE = (
         'S2QUERY_ORIGINAL_PAGE',
         'S2QUERY_FIRST_PAGE',
         'S2QUERY_EACH_PAGE',
     )
Example #5
0
 def __init__(self):
     """Run the SiteS2Query initializer and create empty sub-query slots."""
     SiteS2Query.__init__(self)
     self.fakeoriginalurl = 'https://v.qq.com'
     # This instance is not fully initialized yet, so passing `self` to
     # other classes here would be problematic; any class that needs `self`
     # must therefore not be constructed inside __init__.
     for slot in ('tvtencent', 'actencent', 'ebooktencent',
                  'postqqbooktencent', 'newstencent'):
         setattr(self, slot, None)
 def __init__(self, parent=None):
     """Run the SiteS2Query initializer and set the book.qq.com search settings.

     Args:
         parent: optional object; when truthy, its ``website`` attribute is
             copied onto this instance.
     """
     SiteS2Query.__init__(self)
     self.fakeoriginalurl = 'http://book.qq.com/'
     # Search URL template with {key}, {page_size} and {page} placeholders.
     search_template = 'http://book.qq.com/search/index/wd/{key}/type//ps/{page_size}/p/{page}'
     self.QUERY_TEMPLATE = search_template
     self.DEFAULT_PAGE_SIZE = 30
     self.QUERY, self.FIRST, self.EACH = None, 'FIRST', 'EACH'
     if not parent:
         return
     self.website = parent.website
Example #7
0
    def __init__(self):
        """Run the SiteS2Query initializer and set the Tianya search settings."""
        SiteS2Query.__init__(self)
        # This URL is used to identify the class that receives the returned S2
        # query results; the site's main URL is recommended.
        self.fakeoriginalurl = 'http://search.tianya.cn/bbs?'
        # Search URL template with {key} and {page} placeholders.
        search_template = 'http://search.tianya.cn/bbs?q={key}&pn={page}&s=6&f=3'
        self.QUERY_TEMPLATE = search_template
        self.DEFAULT_PAGE_SIZE, self.DAYS = 75, 7

        # String tags stored on the instance, assigned in their original order.
        (self.S2QUERY_FIRST_PAGE,
         self.S2QUERY_SECOND_PAGE,
         self.S2QUERY_EACH_PAGE) = (
            'S2QUERY_FIRST_PAGE',
            'S2QUERY_SECOND_PAGE',
            'S2QUERY_EACH_PAGE',
        )
 def __init__(self):
     """Run the SiteS2Query initializer and set the baozou search settings.

     Sets the search URL templates, paging values, STEP_* values and the
     regex pattern strings for article and video URLs.
     """
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     self.fakeoriginalurl = 'http://baozou.com/'
     self.queryUrl = 'http://zhannei.baidu.com/cse/search?q={keyword}&p={page}&s=8807869111209310469&entry=1'
     # The page URL reuses the query URL template.
     self.pageUrl = self.queryUrl
     self.maxPage = 76
     # Kept as a float exactly as in the original value.
     self.pageSize = 10.0
     self.STEP_PAGES = None
     self.STEP_ARTICLES_OR_VIDEOS = 1
     # Raw strings: `\.` and `\S` are invalid escape sequences in ordinary
     # string literals (a warning on modern Python); the resulting pattern
     # text is unchanged.
     self.reArticle = r'^http://baozou\.com/articles/\S*'
     self.reVideo = r'^http://baozou\.com/videos/\S*'
 def __init__(self, post_url, parent=None):
     """Run the SiteS2Query initializer and store the POST URL and headers.

     Args:
         post_url: stored as both ``fakeoriginalurl`` and ``post_url``.
         parent: optional object; when truthy, its ``website`` attribute is
             copied onto this instance.
     """
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     self.fakeoriginalurl = post_url
     self.r = RegexUtility()
     #self.post_url = BBSS2PostQuery.POST_URL
     self.post_url = post_url
     self.queryinfo = ''
     if parent:
         self.website = parent.website
     # Header values are named first, then collected into the headers dict.
     user_agent = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/56.0.2924.87 Safari/537.36'
     accepted_encodings = 'gzip, deflate, sdch'
     self.headers = {
         'User-Agent': user_agent,
         'Accept-Encoding': accepted_encodings,
     }
    def __init__(self, parent=None):
        """Run the SiteS2Query initializer and set the ac.qq.com search settings.

        Args:
            parent: optional object; when truthy, its ``website`` attribute is
                copied onto this instance.
        """
        SiteS2Query.__init__(self)
        self.fakeoriginalurl = 'https://ac.qq.com/'
        # URL templates; the placeholders are filled in elsewhere.
        original_template = 'https://v.qq.com/x/search/?q={key}'
        paged_template = 'https://v.qq.com/x/search/?ses={session}&q={key}&filter={ufilter}&cur={page_size}'
        comic_template = 'http://ac.qq.com/Comic/searchList/search/{key}/page/{page_size}'
        filter_template = 'sort={0}&pubfilter={1}&duration={2}&tabid={3}'
        self.ORIGINAL_QUERY_TEMPLATE = original_template
        self.QUERY_TEMPLATE = paged_template
        self.AC_QUERY_TEMPLATE = comic_template
        self.QUERY_TEMPLATE_FILTER = filter_template
        self.DEFAULT_PAGE_SIZE = 28

        self.AC_QUERY, self.AC_FIRST, self.AC_EACH = None, 'AC_FIRST', 'AC_EACH'
        if not parent:
            return
        self.website = parent.website
    def __init__(self, parent=None):
        """Run the SiteS2Query initializer and set the v.qq.com search settings.

        Args:
            parent: optional object; when truthy, its ``website`` attribute is
                copied onto this instance.
        """
        SiteS2Query.__init__(self)
        # This URL is used to identify the class that receives the returned S2
        # query results; the site's main URL is recommended.
        self.fakeoriginalurl = 'http://v.qq.com/'
        # URL templates; the placeholders are filled in elsewhere.
        original_template = 'https://v.qq.com/x/search/?q={key}'
        paged_template = 'https://v.qq.com/x/search/?ses={session}&q={key}&filter={ufilter}&cur={page_size}'
        comic_template = 'http://ac.qq.com/Comic/searchList/search/{key}/page/{page_size}'
        filter_template = 'sort={0}&pubfilter={1}&duration={2}&tabid={3}'
        self.ORIGINAL_QUERY_TEMPLATE = original_template
        self.QUERY_TEMPLATE = paged_template
        self.AC_QUERY_TEMPLATE = comic_template
        self.QUERY_TEMPLATE_FILTER = filter_template
        self.DEFAULT_PAGE_SIZE = 28

        # searchid denotes the time range (set to 9 for "within one week"),
        # orderby the latest reply time, kw the search keyword, page the page.
        #self.BOOK_QUERY_TEMPLATE = 'http://bbs.book.qq.com/search.php?mod=forum&searchid={searchid}&orderby=lastpost&ascdesc=desc&searchsubmit=yes&kw={key}&p={page}'

        self.TV_FIRST, self.TV_SECOND, self.TV_EACH = (
            'TV_FIRST',
            'TV_SECOND',
            'TV_EACH',
        )
        if not parent:
            return
        self.website = parent.website
 def __init__(self):
     """Run the SiteS2Query initializer and set the gfan URL and page size."""
     SiteS2Query.__init__(self)
     self.fakeoriginalurl, self.page_size = (
         'http://bbs.gfan.com.cn/android-8342764-1-1.html',
         10,
     )
 def __init__(self):
     """Run the SiteS2Query initializer and set the 52tian URL and helpers."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     self.fakeoriginalurl = 'http://www.52tian.net/'
     # Value read from the SpiderConfigure instance at construction time.
     configure = SpiderConfigure.getinstance()
     self.querylastdays = configure.getlastdays()
     self.r = RegexUtility()
 def __init__(self):
     """Run the SiteS2Query initializer and set the hupu URL."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     site_url = 'https://my.hupu.com/'
     self.fakeoriginalurl = site_url
Example #15
0
 def __init__(self):
     """Run the SiteS2Query initializer and set the Sina video URL."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     site_url = 'http://video.sina.com.cn/'
     self.fakeoriginalurl = site_url
Example #16
0
 def __init__(self):
     """Run the SiteS2Query initializer and set the ifeng video URL."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     site_url = 'http://v.ifeng.com/'
     self.fakeoriginalurl = site_url
 def __init__(self, parent=None):
     """Run the SiteS2Query initializer and set the duowan URL.

     Args:
         parent: optional object; when truthy, its ``website`` attribute is
             copied onto this instance.
     """
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     self.fakeoriginalurl = 'http://www.duowan.com/'
     if not parent:
         return
     self.website = parent.website
 def __init__(self):
     """Run the SiteS2Query initializer and set the forum URL and regex helper."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     site_url = 'http://forum.home.news.cn/'
     self.fakeoriginalurl = site_url
     self.r = RegexUtility()
 def __init__(self):
     """Run the SiteS2Query initializer and store the dmzj POST and GET URLs."""
     SiteS2Query.__init__(self)
     self.post_url, self.get_url = (
         'http://bbs.dmzj.com/search.php?mod=forum',
         'http://donghua.dmzj.com',
     )
 def __init__(self):
     """Run the SiteS2Query initializer and set the renren001 URL and helpers."""
     SiteS2Query.__init__(self)
     self.fakeoriginalurl = 'http://www.renren001.cc/search/serach'
     self.r = RegexUtility()
     # Value read from the SpiderConfigure instance at construction time.
     configure = SpiderConfigure.getinstance()
     self.querylastdays = configure.getlastdays()
 def __init__(self):
     """Run the SiteS2Query initializer and set the acfun URL and helpers."""
     SiteS2Query.__init__(self)
     self.fakeoriginalurl = 'http://www.acfun.cn/v/'
     self.r = RegexUtility()
     # Value read from the SpiderConfigure instance at construction time.
     configure = SpiderConfigure.getinstance()
     self.querylastdays = configure.getlastdays()
 def __init__(self, parent):
     """Run the SiteS2Query initializer and set the tieba URL and helpers.

     Args:
         parent: required object whose ``website`` attribute is copied onto
             this instance.
     """
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     site_url = 'https://tieba.baidu.com'
     self.fakeoriginalurl = site_url
     self.r = RegexUtility()
     owner_site = parent.website
     self.website = owner_site
Example #23
0
 def __init__(self):
     """Run the SiteS2Query initializer and set the huya URL and helpers."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     self.fakeoriginalurl = 'http://v.huya.com/'
     # Value read from the SpiderConfigure instance at construction time.
     configure = SpiderConfigure.getinstance()
     self.querylastdays = configure.getlastdays()
     self.r = RegexUtility()
Example #24
0
 def __init__(self):
     """Run the SiteS2Query initializer and set the fun.tv URL pattern."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     # NOTE(review): the value contains regex syntax (`[s]{0,1}`) --
     # presumably it is matched as a pattern; confirm against the consumer.
     site_pattern = 'http[s]{0,1}://www.fun.tv/'
     self.fakeoriginalurl = site_pattern
 def __init__(self):
     """Run the SiteS2Query initializer and set the pptv URL and regex helper."""
     SiteS2Query.__init__(self)
     self.fakeoriginalurl = 'http://cartoon.pptv.com/'
     self.r = RegexUtility()
Example #26
0
 def __init__(self):
     """Run the SiteS2Query initializer and set the pcgames URL and helpers."""
     SiteS2Query.__init__(self)
     self.fakeoriginalurl = 'http://bbs.pcgames.com.cn/topic-7979.html'
     self.r = RegexUtility()
     # `maxpages` is not assigned in this method -- presumably provided by
     # SiteS2Query or the class body; TODO confirm.
     self.pagelimit = self.maxpages
     # Value read from the SpiderConfigure instance at construction time.
     configure = SpiderConfigure.getinstance()
     self.querylastdays = configure.getlastdays()
Example #27
0
 def __init__(self):
     """Run the SiteS2Query initializer and set the ku6 URL and regex helper."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     site_url = 'http://comic.ku6.com'
     self.fakeoriginalurl = site_url
     self.r = RegexUtility()
Example #28
0
 def __init__(self, parent=None):
     """Run the SiteS2Query initializer and set the sogou URL and page size.

     Args:
         parent: optional object; when truthy, it is stored as ``website``.
     """
     SiteS2Query.__init__(self)
     self.fakeoriginalurl, self.page_size = 'http://news.sogou.com', 10
     if not parent:
         return
     # NOTE(review): stores `parent` itself rather than `parent.website` --
     # confirm that callers pass the website object directly.
     self.website = parent
 def __init__(self):
     """Run the SiteS2Query initializer and set the narutom URL and regex helper."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     site_url = 'http://www.narutom.com/'
     self.fakeoriginalurl = site_url
     self.r = RegexUtility()
Example #30
0
 def __init__(self):
     """Run the SiteS2Query initializer and set the laohu URL and helpers."""
     SiteS2Query.__init__(self)
     # This URL is used to identify the class that receives the returned S2
     # query results; the site's main URL is recommended.
     site_url = 'http://bbs.laohu.com/'
     self.fakeoriginalurl = site_url
     self.r = RegexUtility()
     # `querylastdays` is not assigned in this method -- presumably provided
     # by SiteS2Query or the class body; TODO confirm.
     last_days = self.querylastdays
     self.inputtime = last_days