def __init__(self, url):
    """Open ``url`` in a new browser and initialise an empty result table.

    Args:
        url: Address of the page to load in the browser.

    Raises:
        ForbiddenAccessError: If the text of the page's ``div[id='header']``
            element, after ``normalize``, equals ``"Server Error"``.
    """
    self.browser = WebBrowser()
    try:
        self.browser.get(url)

        # Check for forbidden access
        header = self.browser.find_element_by_css_selector("div[id='header']")
        server_response = normalize(header.text)
        if server_response == "Server Error":
            raise ForbiddenAccessError
    except BaseException:
        # Construction is failing, so no caller will ever hold a reference
        # to this object; quit the browser here or it is leaked. This
        # covers load/lookup errors as well as the forbidden-access case.
        self.browser.quit()
        raise

    self.table = {}
    # NOTE(review): presumably a wait timeout in seconds -- confirm against
    # the code that reads it.
    self.timeout = 300
def __init__(self, url, skip, batch):
    """Open ``url`` in a new browser and initialise match-report crawl state.

    Args:
        url: Address of the page to load in the browser.
        skip: Number of fixtures to skip.
        batch: Number of fixtures to crawl in one go.

    Raises:
        ForbiddenAccessError: If the text of the page's ``div[id='header']``
            element, after ``normalize``, equals ``"Server Error"``.
    """
    self.browser = WebBrowser()
    try:
        self.browser.get(url)

        # Check for forbidden access
        header = self.browser.find_element_by_css_selector("div[id='header']")
        server_response = normalize(header.text)
        if server_response == "Server Error":
            raise ForbiddenAccessError
    except BaseException:
        # Construction is failing, so no caller will ever hold a reference
        # to this object; quit the browser here or it is leaked. This
        # covers load/lookup errors as well as the forbidden-access case.
        self.browser.quit()
        raise

    self.match_reports = {'reports': []}
    self.timeout = 300  # Wait for 300s for elements to load on the page
    self.skip = skip  # Number of fixtures to skip
    self.batch_size = batch  # Number of fixtures to crawl in one go