def reset(self):
     """Clear this checker's bookkeeping and build a fresh URL opener.

     Each dict-valued attribute is rebound to a new empty dict and the
     counter is zeroed before ``Checker.reset`` runs; the caching opener
     is created last, from ``self.cache`` and ``self.site_url``.
     """
     for attr in ("infos", "files", "redirected", "alias_bases", "sortorder"):
         # A new dict per attribute, so none of them share storage.
         setattr(self, attr, {})
     self.counter = 0
     Checker.reset(self)
     self.urlopener = CachingURLopener(
         cache=self.cache,
         site_url=self.site_url,
     )
 def __setstate__(self, state):
     """Restore the instance from ``state`` on a best-effort basis.

     ``state`` is expected to be a ``(checker_state, own_state)`` pair,
     where ``own_state`` unpacks into ``infos``, ``files``,
     ``redirected`` and ``html_cache``.  The instance is reset first, so
     whatever cannot be restored keeps the values ``reset()`` gave it.
     ``resetRun()`` is always called at the end.
     """
     self.reset()
     try:
         cstate, mystate = state
         Checker.__setstate__(self, cstate)
         self.infos, self.files, self.redirected, self.html_cache = mystate
     except Exception:
         # Deliberately best-effort: a malformed or incompatible state
         # leaves the freshly reset values in place.  Only ``Exception``
         # is caught so KeyboardInterrupt/SystemExit still propagate.
         pass
     self.resetRun()
 def reset(self):
     """Return the instance to an empty state.

     Rebinds every dict-valued attribute (including ``html_cache``) to a
     new empty dict, zeroes the counter, then delegates to
     ``Checker.reset``.
     """
     empty_dict_attrs = (
         "infos",
         "files",
         "redirected",
         "alias_bases",
         "html_cache",
         "sortorder",
     )
     for name in empty_dict_attrs:
         # A new dict per attribute, so none of them share storage.
         setattr(self, name, {})
     self.counter = 0
     Checker.reset(self)
Example #4
0
 def reset(self):
     """Empty the bookkeeping dicts and recreate the caching URL opener.

     The dict attributes and the counter are cleared before
     ``Checker.reset`` is invoked; ``self.urlopener`` is then replaced
     by a new ``CachingURLopener`` built from ``self.cache`` and
     ``self.site_url``.
     """
     dict_attrs = ("infos", "files", "redirected", "alias_bases", "sortorder")
     for dict_attr in dict_attrs:
         setattr(self, dict_attr, {})
     self.counter = 0
     Checker.reset(self)
     self.urlopener = CachingURLopener(
         cache=self.cache, site_url=self.site_url
     )
 def readhtml(self, url_pair):
     """Return the result of reading ``url_pair``, memoised per instance.

     On a miss the work is delegated to ``Checker.readhtml`` and the
     result is stored in ``self.html_cache`` under ``url_pair``; on a
     hit the stored result is returned without calling ``Checker``.
     """
     if url_pair not in self.html_cache:
         page = Checker.readhtml(self, url_pair)
         self.html_cache[url_pair] = page
         return page
     return self.html_cache[url_pair]
Example #6
0
 def isallowed(self, root, url):
     """Tell whether ``url`` may be fetched.

     Returns ``True`` unconditionally when ``self.ignore_robots`` is
     truthy; otherwise the decision is delegated to
     ``Checker.isallowed``.
     """
     return True if self.ignore_robots else Checker.isallowed(self, root, url)
Example #7
0
 def readhtml(self, url_pair):
     """Delegate straight to ``Checker.readhtml`` and return its result."""
     return Checker.readhtml(self, url_pair)
 def isallowed(self, root, url):
     """Decide whether ``url`` may be fetched.

     ``Checker.isallowed`` is consulted only when ``self.ignore_robots``
     is falsy; with the flag set, every URL is allowed.
     """
     if not self.ignore_robots:
         return Checker.isallowed(self, root, url)
     return True
 def readhtml(self, url_pair):
     """Return whatever ``Checker.readhtml`` yields for ``url_pair``.

     No extra processing is applied here.
     """
     return Checker.readhtml(self, url_pair)
 def __getstate__(self):
     """Return the picklable state as ``(checker_state, own_state)``.

     ``own_state`` is the tuple ``(infos, files, redirected,
     html_cache)``; ``checker_state`` is whatever
     ``Checker.__getstate__`` returns.
     """
     own_state = (
         self.infos,
         self.files,
         self.redirected,
         self.html_cache,
     )
     checker_state = Checker.__getstate__(self)
     return checker_state, own_state