コード例 #1
0
def get_info(id):
    """Fetch and print the rendered submissions page of one user.

    Loads ``submits/view.php`` on informatics.mccme.ru for the given user in
    a ``Browser`` instance, waits for the page load to finish and prints the
    resulting HTML to stdout.

    Args:
        id: User identifier placed in the ``user_id`` query parameter. Any
            value that can be formatted with ``%s`` is accepted, so both
            ``str`` and ``int`` ids work.

    Returns:
        None. The HTML is only printed.
    """
    # NOTE: a previous, disabled variant of this function logged in through
    # Selenium/Chrome and a ``requests`` session before opening the page.
    # No login is performed here, so the page is requested anonymously.
    browser = Browser()
    try:
        # ``%s`` formatting (instead of ``+``) avoids a TypeError when the
        # caller passes a numeric id; the 1-tuple keeps tuple ids safe too.
        browser.load(
            'http://informatics.mccme.ru/submits/view.php?user_id=%s' % (id,))
        browser.wait_load()
        html = browser.html
    finally:
        # Release the browser even when loading fails.
        # NOTE(review): assumes ``Browser`` is spynner's, which provides
        # ``close()`` - confirm against this file's imports.
        browser.close()

    print(html)
コード例 #2
0
    def __init__(self, source_lang, target_lang, translate_type='headless'):
        """Store the language pair and select the translation backend.

        Args:
            source_lang: Language to translate from; stored as-is.
            target_lang: Language to translate into; stored as-is.
            translate_type: One of ``'simple'``, ``'headless'`` or
                ``'selenium'``. ``'headless'`` creates a ``Browser`` that
                parses HTML with ``PyQuery``; ``'selenium'`` starts a
                Firefox webdriver; ``'simple'`` creates neither.

        Raises:
            KeyError: If ``translate_type`` is not one of the three values
                listed above.
        """
        self.source_lang = source_lang
        self.target_lang = target_lang

        # Both handles always exist as attributes; at most one of them is
        # replaced by a live object below.
        self.headless_browser = None
        self.driver = None

        if translate_type == 'selenium':
            self.driver = webdriver.Firefox()
        elif translate_type == 'headless':
            self.headless_browser = Browser()
            self.headless_browser.set_html_parser(PyQuery)

        # Bind ``self.translate`` to the implementation that matches the
        # requested backend.
        translators = {
            'simple': self.translate_simple,
            'headless': self.translate_text_google_headless,
            'selenium': self.translate_text_google,
        }
        self.translate = translators[translate_type]
コード例 #3
0
    def process_request(self, request, spider):
        """Render ``request.url`` in a ``Browser`` and return the page HTML.

        NOTE(review): the signature looks like a Scrapy downloader-middleware
        hook - confirm against the enclosing class.

        Args:
            request: Object whose ``url`` attribute is the page to render.
            spider: Unused here.

        Returns:
            An ``HtmlResponse`` for ``request.url`` whose body is the
            rendered HTML encoded as UTF-8.
        """
        browser = Browser()
        try:
            browser.create_webview()
            browser.set_html_parser(PyQuery)
            # presumably 20 is a load timeout in seconds - TODO confirm
            browser.load(request.url, 20)

            try:
                browser.wait_load(10)
            except Exception:
                # Best effort: keep whatever has been rendered so far.
                # ``Exception`` (not a bare ``except``) lets
                # KeyboardInterrupt/SystemExit propagate.
                print('###########ERROR###########')

            # Encode once; wrapping the result in ``str()`` is a no-op on
            # Python 2 and would yield the ``b'...'`` repr on Python 3.
            body = browser.html.encode('utf-8')
        finally:
            # A browser is created per request, so it must be released
            # here or instances pile up for the lifetime of the process.
            # NOTE(review): assumes spynner's ``Browser.close()``.
            browser.close()

        # Declare the encoding explicitly so the response is not decoded
        # with a charset guessed from the page content.
        return HtmlResponse(request.url, body=body, encoding='utf-8')
コード例 #4
0
#
# app = QApplication(sys.argv)
# web = QWebView()
# web.load(QUrl(url))
# f = lambda x: x
# # QObject.connect(web, SIGNAL("loadFinished"), f(4))
#

# import mechanize
# url = "http://www.spanishenglish.com/"
# browser = mechanize.Browser()
# browser.set_handle_robots(False)
# browser.open(url)

# Demo script: drive the translation form on spanishenglish.com through a
# spynner browser and read back the translated text.
import time

from pyquery import PyQuery
from spynner import Browser

url = "http://www.spanishenglish.com/"

browser = Browser()
browser.set_html_parser(PyQuery)
browser.load(url)
# Parenthesised form prints the same text on Python 2 and is valid on
# Python 3, where the bare print statement is a SyntaxError.
print("LOADED")

# presumably these two clicks choose the language pair (en -> de) - verify
# against the page markup
browser.click("a[href='#en']", wait_load=False)
browser.click("#LangPair_ToDDL tbody tr td a[href='#de']", wait_load=False)

browser.wk_fill("#InputText", "How are you doing today?")
browser.click_ajax("#TranslateButton")

# Fixed pause before reading the output element.
time.sleep(15)
result_box = browser.soup('#TranslationOutput')[0]
translated_text = result_box.text_content()
# browser.show()
time.sleep(30)