def get_possible_translations(from_lang_code, to_lang_code):
    """

        Returns a list of possible translations in :param to_lang_code
        for :param word in :param from_lang_code.

        You must also specify the :param context, :param url, and :param title
         of the page where the word was found.

        The context is the sentence.

        :return: json array with translations

    """
    data = {"from_lang_code": from_lang_code, "to_lang_code": to_lang_code}
    data["context"] = request.form.get('context', '')
    url = request.form.get('url', '')
    data["url"] = url
    article_id = None
    if 'articleID' in url:
        article_id = url.split('articleID=')[-1]
        url = Article.query.filter_by(id=article_id).one().url.as_canonical_string()
    elif 'articleURL' in url:
        url = url.split('articleURL=')[-1]
    else:
        # the url comes from elsewhere not from the reader, so we find or creat the article
        article = Article.find_or_create(db_session, url)
        article_id = article.id
    zeeguu_core.log(f"url before being saved: {url}")
    word_str = request.form['word']
    data["word"] = word_str
    title_str = request.form.get('title', '')
    data["title"] = title_str

    zeeguu_core.log(f'translating to... {data["to_lang_code"]}')
    minimal_context, query = minimize_context(
        data["context"], data["from_lang_code"], data["word"])
    zeeguu_core.log(f"Query to translate is: {query}")
    data["query"] = query
    translations = get_all_translations(data).translations
    zeeguu_core.log(f"Got translations: {translations}")

    # translators talk about quality, but our users expect likelihood.
    # rename the key in the dictionary
    for t in translations:
        t['likelihood'] = t.pop("quality")
        t['source'] = t.pop('service_name')

    best_guess = translations[0]["translation"]

    Bookmark.find_or_create(db_session, flask.g.user,
                            word_str, from_lang_code,
                            best_guess, to_lang_code,
                            minimal_context, url, title_str, article_id)

    return json_result(dict(translations=translations))
def translate_and_bookmark(from_lang_code, to_lang_code):
    """

        @deprecated
        This should be deprecated and /get_possible_translations used instead
        However, it is still used by the zeeguu chrome extension.

        This expects in the post parameter the following:
        - word (to translate)
        - context (surrounding paragraph of the original word )
        - url (of the origin)
        - title (of the origin page)

        /get_possible_translations has very similar behavior, only that
          if focuses on returning the possible alternative translations

    :param from_lang_code:
    :param to_lang_code:
    :return:
    """

    data = {"from_lang_code": from_lang_code, "to_lang_code": to_lang_code}
    word_str = unquote_plus(request.form['word'])
    data["word"] = word_str
    url_str = request.form.get('url', '')
    data["url"] = url_str

    title_str = request.form.get('title', '')
    data["title"] = title_str
    context_str = request.form.get('context', '')
    data["context"] = context_str

    # the url comes from elsewhere not from the reader, so we find or creat the article
    article = Article.find_or_create(db_session, url_str)
    article_id = article.id

    try:

        minimal_context, query = minimize_context(
            data["context"], data["from_lang_code"], data["word"])
        data["query"] = query
        translations = get_all_translations(data).translations

        best_guess = translations[0]["translation"]

        bookmark = Bookmark.find_or_create(db_session, flask.g.user,
                                           word_str, from_lang_code,
                                           best_guess, to_lang_code,
                                           minimal_context, url_str, title_str, article_id)
    except ValueError as e:
        zeeguu_core.log(f"minimize context failed {e}on: {context_str} x {from_lang_code} x {word_str} ")
        return context_str, query

    return json_result(dict(
        bookmark_id=bookmark.id,
        translation=best_guess))
def contribute_translation(from_lang_code, to_lang_code):
    """
    
        User contributes a translation they think is appropriate for 
         a given :param word in :param from_lang_code in a given :param context

        The :param translation is in :param to_lang_code

        Together with the two words and the textual context, you must submit
         also the :param url, :param title of the page where the original
         word and context occurred.
    
    :return: in case of success, the bookmark_id and main translation

    """

    # All these POST params are mandatory
    word_str = unquote_plus(request.form['word'])
    translation_str = request.form['translation']
    url = request.form.get('url', '')
    context_str = request.form.get('context', '')
    title_str = request.form.get('title', '')
    # when a translation is added by hand, the servicename_translation is None
    # thus we set it to MANUAL
    service_name = request.form.get('servicename_translation', 'MANUAL')

    article_id = None
    if 'articleID' in url:
        article_id = url.split('articleID=')[-1]
        url = Article.query.filter_by(id=article_id).one().url.as_canonical_string()
    elif 'articleURL' in url:
        url = url.split('articleURL=')[-1]
    else:
        # the url comes from elsewhere not from the reader, so we find or creat the article
        article = Article.find_or_create(db_session, url)
        article_id = article.id

    # Optional POST param
    selected_from_predefined_choices = request.form.get('selected_from_predefined_choices', '')

    minimal_context, _ = minimize_context(context_str, from_lang_code, word_str)

    bookmark = Bookmark.find_or_create(db_session, flask.g.user,
                                       word_str, from_lang_code,
                                       translation_str, to_lang_code,
                                       minimal_context, url, title_str, article_id)
    # Inform apimux about translation selection
    data = {"word_str": word_str, "translation_str": translation_str,
            "url": url, "context_size": len(context_str),
            "service_name": service_name}
    contribute_trans(data)
    return json_result(dict(bookmark_id=bookmark.id))
Esempio n. 4
0
def get_one_translation(from_lang_code, to_lang_code):
    """

    Addressing some of the problems with the
    get_next_translations...
    - it should be separated in get_first and get_alternatives
    - alternatively it can be get one and get all

    To think about:
    - it would also make sense to separate translation from
    logging; or at least, allow for situations where a translation
    is not associated with an url... or?

    :return: json array with translations
    """

    word_str = request.form["word"]
    url = request.form.get("url")
    title_str = request.form.get("title", "")
    context = request.form.get("context", "")

    minimal_context, query = minimize_context(context, from_lang_code, word_str)

    translation = own_translation(
        flask.g.user, word_str, from_lang_code, to_lang_code, minimal_context
    )
    if translation:
        return json_result(dict(translations=translation))

    translations = get_next_results(
        {
            "from_lang_code": from_lang_code,
            "to_lang_code": to_lang_code,
            "url": request.form.get("url"),
            "word": word_str,
            "title": title_str,
            "query": query,
            "context": minimal_context,
        },
        number_of_results=1,
    ).translations

    # do we really need this?
    # translators talk about quality, but our users expect likelihood.
    # rename the key in the dictionary
    for t in translations:
        t["likelihood"] = t.pop("quality")
        t["source"] = t["service_name"]

    article_id = None
    if "article?id=" in url:
        article_id = url.split("article?id=")[-1]
        url = Article.query.filter_by(id=article_id).one().url.as_canonical_string()
    else:
        # the url comes from elsewhere not from the reader, so we find or creat the article
        article = Article.find_or_create(db_session, url)
        article_id = article.id

    if len(translations) > 0:
        best_guess = translations[0]["translation"]

        Bookmark.find_or_create(
            db_session,
            flask.g.user,
            word_str,
            from_lang_code,
            best_guess,
            to_lang_code,
            minimal_context,
            url,
            title_str,
            article_id,
        )

    return json_result(dict(translations=translations))
Esempio n. 5
0
def get_next_translations(from_lang_code, to_lang_code):
    """
    Returns a list of possible translations in :param to_lang_code
    for :param word in :param from_lang_code.

    You must also specify the :param context, :param url, and :param title
     of the page where the word was found.

    The context is the sentence.

    :return: json array with translations
    """

    data = {"from_lang_code": from_lang_code, "to_lang_code": to_lang_code}
    data["context"] = request.form.get("context", "")
    url = request.form.get("url", "")
    number_of_results = int(request.form.get("numberOfResults", -1))

    service_name = request.form.get("service", "")

    exclude_services = [] if service_name == "" else [service_name]
    currentTranslation = request.form.get("currentTranslation", "")

    exclude_results = [] if currentTranslation == "" else [currentTranslation.lower()]
    data["url"] = url
    article_id = request.form.get("articleID", None)

    if article_id == None:
        if "articleID" in url:
            article_id = url.split("articleID=")[-1]
            url = Article.query.filter_by(id=article_id).one().url.as_canonical_string()
        elif "articleURL" in url:
            url = url.split("articleURL=")[-1]
        else:
            # the url comes from elsewhere not from the reader, so we find or creat the article
            article = Article.find_or_create(db_session, url)
            article_id = article.id
    zeeguu_core.log(f"url before being saved: {url}")
    word_str = request.form["word"]
    data["word"] = word_str
    title_str = request.form.get("title", "")
    data["title"] = title_str

    zeeguu_core.log(f'translating to... {data["to_lang_code"]}')
    minimal_context, query = minimize_context(
        data["context"], data["from_lang_code"], data["word"]
    )
    zeeguu_core.log(f"Query to translate is: {query}")
    data["query"] = query

    first_call_for_this_word = len(exclude_services) == 0

    if first_call_for_this_word:
        translations = own_or_crowdsourced_translation(
            flask.g.user, word_str, from_lang_code, to_lang_code, minimal_context
        )
        if translations:
            return json_result(dict(translations=translations))

    translations = get_next_results(
        data,
        exclude_services=exclude_services,
        exclude_results=exclude_results,
        number_of_results=number_of_results,
    ).translations

    # translators talk about quality, but our users expect likelihood.
    # rename the key in the dictionary
    for t in translations:
        t["likelihood"] = t.pop("quality")
        t["source"] = t["service_name"]

    if len(translations) > 0 and first_call_for_this_word:
        best_guess = translations[0]["translation"]

        Bookmark.find_or_create(
            db_session,
            flask.g.user,
            word_str,
            from_lang_code,
            best_guess,
            to_lang_code,
            minimal_context,
            url,
            title_str,
            article_id,
        )

    return json_result(dict(translations=translations))