if retries == 0: print "Can't reach firefly on port %d!" % self._port raise retries -= 1 time.sleep([30, 10, 2][retries]) return self._send_command(command, retries) def get_visual_elements(self, url): return self._send_command('GOTO %s' % url) ################ ## DEBUG CODE ## ################ if __name__ == '__main__': import firefox_startup if len(sys.argv) < 4: print "usage: %s profile port website" % argv[1] print sys.argv profile = sys.argv[1] port = int(sys.argv[2]) website = sys.argv[3] firefox_startup.startup_firefox(profile) print Firefly(port).get_visual_elements(website)
# Bail out early unless both positional arguments (profile name and port)
# were supplied on the command line.
if len(sys.argv) <= 2:
    print('usage: %s profile_name port' % sys.argv[0])
    sys.exit(1)

# Positional arguments: the Firefox profile to launch, and the port that is
# handed to Firefly below (must parse as an integer).
profile_name = sys.argv[1]
profile_port = int(sys.argv[2])

# Headless environment (currently disabled)
#vd = Display(visible=0, size=(640,480))
#vd.start()

# Launch a browser window under the requested profile.
firefox_startup.startup_firefox(profile_name)

# Build the Firefly client. NOTE: from here on the name `firefly` refers to
# this instance and no longer to the `firefly` module.
firefly = firefly.Firefly(profile_port)

##############################################
##                                          ##
## Sample crawl (add desired functionality) ##
##                                          ##
##############################################

# Sites visited by the sample crawl, and a running count of failures.
urls = ['www.google.com', 'www.nytimes.com', 'www.yahoo.com']
errors = 0