def get_info(id):
    """Load a user's submissions page on informatics.mccme.ru and print it.

    The page is fetched anonymously with a headless ``Browser``; no login
    is performed, so only what the site serves to unauthenticated visitors
    is retrieved.

    Args:
        id: User identifier appended to the ``user_id`` query parameter.
            Strings and integers are both accepted.

    Returns:
        The HTML of the loaded page (the same text that is printed).
    """
    # '%s' formatting accepts numeric ids as well as strings, whereas plain
    # concatenation raised TypeError for anything that was not a string.
    page_url = 'http://informatics.mccme.ru/submits/view.php?user_id=%s' % (id,)

    browser = Browser()
    try:
        browser.load(page_url)
        browser.wait_load()
        html = browser.html
    finally:
        # Release the browser even when loading fails or times out.
        browser.close()

    print(html)
    return html
def __init__(self, source_lang, target_lang, translate_type='headless'):
    """Configure the translator for one language pair and one backend.

    Args:
        source_lang: Language to translate from; stored as-is.
        target_lang: Language to translate to; stored as-is.
        translate_type: Backend selector. ``'headless'`` creates a
            ``Browser`` that parses HTML with ``PyQuery``; ``'selenium'``
            starts a Firefox webdriver; ``'simple'`` creates neither.

    Raises:
        KeyError: If ``translate_type`` is not one of the three values above.
    """
    self.source_lang = source_lang
    self.target_lang = target_lang

    # Both backend handles always exist on the instance; only the one that
    # matches translate_type is populated below.
    self.headless_browser = None
    self.driver = None
    if translate_type == 'selenium':
        self.driver = webdriver.Firefox()
    elif translate_type == 'headless':
        self.headless_browser = Browser()
        self.headless_browser.set_html_parser(PyQuery)

    # Bind self.translate to the implementation matching the chosen backend.
    strategies = {
        'simple': self.translate_simple,
        'headless': self.translate_text_google_headless,
        'selenium': self.translate_text_google,
    }
    self.translate = strategies[translate_type]
def process_request(self, request, spider):
    """Render ``request.url`` in a headless browser and return its HTML.

    A fresh ``Browser`` is created for every request, used to load the
    page, and closed again before the response is returned.

    Args:
        request: Request whose ``url`` is loaded in the browser.
        spider: Unused here; part of the method's signature.

    Returns:
        An ``HtmlResponse`` for ``request.url`` whose body is the browser's
        HTML encoded as UTF-8.
    """
    browser = Browser()
    try:
        browser.create_webview()
        browser.set_html_parser(PyQuery)
        # NOTE(review): 20 and 10 look like timeouts in seconds -- confirm
        # against the Browser API.
        browser.load(request.url, 20)
        try:
            browser.wait_load(10)
        except Exception:
            # Best effort: a failed wait still leaves whatever HTML has been
            # loaded so far, so report the problem and carry on. Catching
            # Exception (not a bare except) lets Ctrl-C and SystemExit through.
            print('###########ERROR###########')
        body = browser.html.encode('utf-8')
    finally:
        # Without this every request leaked a browser and its webview.
        browser.close()

    # The body was just encoded as UTF-8, so say so explicitly instead of
    # letting the response guess from a possibly different <meta charset>.
    return HtmlResponse(request.url, body=body, encoding='utf-8')
# Scratch script: drive the translation form on spanishenglish.com with a
# headless spynner browser and read the translated text back from the page.
import time

from pyquery import PyQuery
from spynner import Browser

url = "http://www.spanishenglish.com/"

browser = Browser()
try:
    browser.set_html_parser(PyQuery)
    browser.load(url)
    print("LOADED")

    # Pick the language pair. NOTE(review): '#en' / '#de' presumably select
    # English as source and German as target -- confirm against the page.
    browser.click("a[href='#en']", wait_load=False)
    browser.click("#LangPair_ToDDL tbody tr td a[href='#de']", wait_load=False)

    # Enter the text and submit the form.
    browser.wk_fill("#InputText", "How are you doing today?")
    browser.click_ajax("#TranslateButton")

    # Fixed pause before reading the output box, which the page is expected
    # to fill in asynchronously after the click.
    time.sleep(15)
    result_box = browser.soup('#TranslationOutput')[0]
    translated_text = result_box.text_content()

    # Call browser.show() here to inspect the page during the pause below.
    time.sleep(30)
finally:
    # Release the browser even if a step above fails.
    browser.close()