示例#1
0
    def __init__(self, postedUrlSet=None):
        """Initialise the parser for the 163.com news ranking page.

        postedUrlSet is stored unchanged on a private attribute; the name
        suggests the URLs that were already posted (confirm with callers).
        """
        BaseParser.__init__(self)

        # Address of the news.163.com ranking page.
        self.baseurl = "http://news.163.com/rank/"
        self.__postedUrlSet = postedUrlSet

        # Ordinal of the div(.tabBox) on the page for each category to
        # extract; the URLs of the chosen block are pulled out based on it.
        self.__typeIndexMap = {
            "ent": 5,
            "news": 1,
        }
示例#2
0
 def __init__(self, postedUrlSet=None):
     """Initialise the parser for the 163.com news ranking page.

     postedUrlSet is kept as-is on a private attribute; judging by its
     name it holds already-posted URLs (confirm with callers).
     """
     BaseParser.__init__(self)

     # Address of the news.163.com ranking page.
     self.baseurl = "http://news.163.com/rank/"
     self.__postedUrlSet = postedUrlSet

     # Ordinal of the div(.tabBox) on the page for each category to
     # extract; the URLs of the chosen block are pulled out based on it.
     self.__typeIndexMap = {"ent": 5, "news": 1}
示例#3
0
 def __init__(self, message):
     """Initialise the base parser with ``message``, then call is_success()."""
     BaseParser.__init__(self, message)
     # The return value is discarded here.
     # NOTE(review): presumably invoked for a side effect such as
     # validating the message -- confirm against is_success().
     self.is_success()
示例#4
0
 def __init__(self, postedUrlSet=None):
     """Initialise the base parser and remember ``postedUrlSet``.

     postedUrlSet defaults to None and is stored without copying.
     """
     BaseParser.__init__(self)
     # Collection of items that were already fetched and posted.
     self.__postedUrlSet = postedUrlSet        
示例#5
0
 def __init__(self):
     """Initialise the parser with its name, base URL and start position."""
     BaseParser.__init__(self)
     self.name = "xiachufang"
     # Prefix of recipe pages on xiachufang.com.
     self.baseurl = "http://www.xiachufang.com/recipe/"
     # Start position.
     # NOTE(review): what is counted from this position is not visible
     # here -- confirm where __start is read.
     self.__start = 0
示例#6
0
 def __init__(self):
     """Initialise the parser with its name and base URL."""
     BaseParser.__init__(self)
     self.name = "xiachufang"
     # Prefix of recipe pages on xiachufang.com.
     self.baseurl = "http://www.xiachufang.com/recipe/"        
示例#7
0
 def __init__(self, postedUrlSet=None):
     """Initialise the base parser and remember ``postedUrlSet``.

     postedUrlSet defaults to None and is stored without copying.
     """
     BaseParser.__init__(self)
     # Collection of items that were already fetched and posted.
     self.__postedUrlSet = postedUrlSet
示例#8
0
 def __init__(self, urlSet=None):
     """Initialise the parser with its news.qq.com URLs and ``urlSet``.

     urlSet defaults to None and is stored without copying; the attribute
     name suggests it holds already-posted entries (confirm with callers).
     """
     BaseParser.__init__(self)
     
     # Site root of news.qq.com.
     self.baseUrl = "http://news.qq.com"
     # NOTE(review): presumably the listing page the parser starts
     # from -- confirm where oriUrl is read.
     self.oriUrl = "http://news.qq.com/newssh/qiwen.shtml"
     self.__postedSet = urlSet