Example #1
0
	def start_fetch(self, url, level = 1):
		"""Fetch ``url``, store the page when data came back, return its sub-URLs.

		The URL is remembered on ``self.url``. Data is obtained through
		``getFetcher(self.url, self.uid, self.upwd).fetchData()``.

		Args:
			url: Address to fetch; also handed to ``getSubTotalURLS``
				together with the fetched data.
			level: Forwarded unchanged as the last argument of
				``write_to_database`` (defaults to 1).

		Returns:
			Whatever ``getSubTotalURLS(fetched_data, url)`` produced. It is
			computed before the emptiness check, so it is returned even
			when nothing is written to the database.
		"""
		self.url = url
		fetcher = getFetcher(self.url, self.uid, self.upwd)
		page = fetcher.fetchData()
		links = getSubTotalURLS(page, url)

		# Nothing fetched: skip the database write but still report links.
		if len(page) == 0:
			return links

		heading = get_title(page)
		if len(heading) == 0:
			# Fall back to a synthetic title built from the URL.
			heading = 'Default' + self.url

		# NOTE(review): meaning of partPage's second argument (0) and of the
		# two leading 1s passed to write_to_database is not visible here.
		body = partPage(page, 0)
		self.write_to_database(1, 1, heading, body, self.url, level)
		return links
Example #2
0
 def start_fetch(self, url, level=1):
     """Fetch ``url``, store the page when data came back, return its sub-URLs.

     The URL is remembered on ``self.url``. Data is obtained through
     ``getFetcher(self.url, self.uid, self.upwd).fetchData()``.

     Args:
         url: Address to fetch; also handed to ``getSubTotalURLS``
             together with the fetched data.
         level: Forwarded unchanged as the last argument of
             ``write_to_database`` (defaults to 1).

     Returns:
         Whatever ``getSubTotalURLS(fetched_data, url)`` produced. It is
         computed before the emptiness check, so it is returned even
         when nothing is written to the database.
     """
     self.url = url
     fetcher = getFetcher(self.url, self.uid, self.upwd)
     fetched = fetcher.fetchData()
     sub_urls = getSubTotalURLS(fetched, url)

     # Nothing fetched: skip the database write but still report links.
     if len(fetched) == 0:
         return sub_urls

     page_title = get_title(fetched)
     if len(page_title) == 0:
         # Fall back to a synthetic title built from the URL.
         page_title = 'Default' + self.url

     # NOTE(review): meaning of partPage's second argument (0) and of the
     # two leading 1s passed to write_to_database is not visible here.
     content = partPage(fetched, 0)
     self.write_to_database(1, 1, page_title, content, self.url, level)
     return sub_urls
Example #3
0
	def getSublinks(self, rawdata, baseurl):
		"""Return the result of ``getSubTotalURLS(rawdata, baseurl)``.

		Thin method wrapper around the module-level helper; it does not
		read or modify any instance state.

		Args:
			rawdata: Passed through as the first argument of the helper.
			baseurl: Passed through as the second argument of the helper.
		"""
		sublinks = getSubTotalURLS(rawdata, baseurl)
		return sublinks