コード例 #1
0
def test_mutil_sent_trans():
    en = 'hello. china.'
    translator = Translator.translator(src='en', dest='fr')
    rep = translator.translate('hello. china.', multi=True)
    print(rep)
    assert rep[0][0].lower() == 'bonjour. '
    assert rep[1][0].lower() == 'chine.'
コード例 #2
0
def test_translation():
    en = 'china'
    fr = 'chine'
    translator = Translator.translator(src='en', dest='fr')
    out = translator.translate(en)
    print(out)
    assert out.lower() == fr
コード例 #3
0
ファイル: google_trans_v2.py プロジェクト: yuanhuiru/xnr2
 def trans(self, q):
     try:
         translator = TS.translator(src='auto', dest=self.toLang)
         text = translator.translate(q)
         return text
     except Exception,e:
         print 'google_trans_v2 Exception: ', str(e)
         return False
def google_translate(token, content, from_lang='auto', to_lang='en'):
    from GoogleFreeTrans import Translator
    content = content.lower().replace('\n', ' ')
    try:
        translator = Translator.translator(src=from_lang, dest=to_lang)
        dst = translator.translate(content)
    except:
        print('from', content, 'to', 'error')
    else:
        if dst != None and len(dst) > 10:
            ''' save the english tweets, the similarity of tweet and translated one should be low than 0.5 '''
            ratio = difflib.SequenceMatcher(None, content, dst).quick_ratio()
            if ratio < 0.5 and judLanguage(dst) == 'en':
                # print('from', content, 'to', dst)
                return dst
    return ""
コード例 #5
0
    def translate(self):
        translator = Translator.translator('fa', 'en')
        key_word = {"اگر": "if", "وگر": "elif", "وگرنه": "else", "واردکن": "import", "کلاس": "class",
                    "تعریف": "def", "تازمانیکه": "while", "برای": "for", "در": "in", "نه": "not",
                    "و": "and", "یا": "or", "برگردان": "return", "چاپ": "print", "ادامه": "continue", "توقف": "break"}
        sybols = [":", "<", "<", "=", "==", "+", "_", "*", "**", "(", ")", "[", "]", "{", "}", "\\", "\"", "\'", "\n",
                  "<=",
                  "<>", ">=", "#", ""]

        codeTextPersian = self.srcTextEdit.toPlainText()
        codeWordsPersian = codeTextPersian.replace(" ", " s ").replace("\n", " n ").replace("\t", " t ").split(" ")
        englishCode = ""
        word_dict = {}
        for word in codeWordsPersian:
            if word in key_word.keys():
                word_dict[key_word[word]] = word
                englishCode += key_word[word]
            elif word in sybols:
                word_dict[word] = word
                englishCode += word
            elif word == "s":
                englishCode += " "
            elif word == "n":
                englishCode += "\n"
            elif word == "t":
                englishCode += "\t"
            else:

                newWord = 'ـ'.join(translator.translate(word).split(" "))
                word_dict[newWord] = word
                englishCode += newWord
        print(word_dict)
        lex = lexer.lexer(englishCode)
        lex = lex.split("\n")
        finalCode = ""
        for line in lex:
            l = line.split(" |")
            if l[0] in word_dict.keys():
                if len(l) > 1:

                    finalCode += str(word_dict[l[0]]) + " |" + l[1] + "\n"
        self.destTextEdit.setPlainText(finalCode)
        finalFile = open("englishCode.txt", "w")
        finalFile.write(englishCode)
コード例 #6
0
def visitURL(base_url):
    # base_url = "https://mp.weixin.qq.com/s?src=11&timestamp=1586779202&ver=2276&signature=Hu*YxuJwLetW6Eu24Hju2QRQyiQten3BK8ER9i92SnqBja57Pbn*MLtAb8XEMKpPs0nLxl8IU3T6TRck1EGWlPYLfGBBy8pKPXKqSeHv-Oc=&new=1"

    html = urllib.request.urlopen(base_url).read()
    data = parsel.Selector(str(html))
    text = data.xpath('//div[@class="rich_media_content "]/p/text()').extract()
    if not text:
        print("None,change filter2")
        text = data.xpath(
            '//section[@data-bcless="lighten"]//span/text()').extract()

    if not text:
        print("None,change filter3")
        text = data.xpath(
            '//div[@class="rich_media_content "]//section/text()').extract()

    if not text:
        print("None,change filter4")
        text = data.xpath(
            '//div[@class="rich_media_content "]/text()').extract()

    translator = Translator.translator(src='zh-CN', dest='en')

    page_content = ""
    if not text:
        print("empty response")
        return page_content

    for item in text:
        text_split = item.split('\\')[1:]

        raw_paper_sentence = getSentence(text_split)
        transed_paper_sentence = translator.translate(raw_paper_sentence)
        # print(raw_paper_sentence+'\n'+transed_paper_sentence)

        page_content += transed_paper_sentence

    return page_content
コード例 #7
0
def test_special_chars():
    text = u"©×《》"
    translator = Translator.translator(src='en', dest='en')
    rep = translator.translate(text)
    print(rep)
    assert rep == text
コード例 #8
0
def test_unicode():
    translator = Translator.translator(src='ko', dest='ja')
    result = translator.translate('안녕하세요.')
    print(result)
    assert result == u'こんにちは。'
コード例 #9
0
# utils = rpackages.importr('utils')
# # select a mirror for R packages
# utils.chooseCRANmirror(ind=1) # select the first mirror in the list
# # R package names
# packnames = ('fpp', 'forecast')
# # R vector of strings
# from rpy2.robjects.vectors import StrVector
# # Selectively install what needs to be install.
# if len(packnames) > 0:
#     utils.install_packages(StrVector(packnames))

# predict total sales for every product and store for the next month

sns.set()

translator = Translator.translator(src='ru', dest='en')

item_cat_df = pd.read_csv('item_categories.csv', sep=',', index_col=0)
items_df = pd.read_csv('items.csv', sep=',', index_col=0)
sales_train_df = pd.read_csv('sales_train.csv', sep=',', index_col=0)
sample_submission_df = pd.read_csv('sample_submission.csv',
                                   sep=',',
                                   index_col=0)
shops_df = pd.read_csv('shops.csv', sep=',', index_col=0)
test_df = pd.read_csv('test.csv', sep=',', index_col=0)

eng_item_cat_df = pd.read_csv('eng_item_categories.csv', sep=',', index_col=0)
eng_item_cat_df.columns = ['item_category_id']
eng_shops_df = pd.read_csv('eng_shops.csv', sep=',', index_col=0)

sales_train_df.describe()
コード例 #10
0
ファイル: translator_2.py プロジェクト: taiditek/PythonDemo
def translate(str, lan):
    # translator = Translator.translator(src='en', dest='zh-CN')
    translator = Translator.translator(src='en', dest=lan)
    result = translator.translate(str)
    # print(result)
    return result
コード例 #11
0
def parser(appid, appname, zone):
    print("[" + appname + "]")
    page = 1
    count = 0
    translator = Translator.translator(src='auto', dest='zh-CN')
    # 默认循环10次,获取500条数据
    while page < 11:
        myurl = "https://itunes.apple.com/" + zone + "/rss/customerreviews/page=" + str(
            page) + "/id=" + str(appid) + "/sortby=mostrecent/xml"
        response = requests.request("GET", myurl)
        xmlstr = response.text
        xmlparse = xmltodict.parse(xmlstr)
        myjson = json.loads(json.dumps(xmlparse, indent=1))
        print(myurl)
        if "entry" in myjson["feed"]:
            count += len(myjson["feed"]["entry"])
            for i in myjson["feed"]["entry"]:
                # (id) id - i["id"]
                id = i["id"]
                # (时间) time - i["updated"]
                updated = i["updated"]
                # (用户) name - i["author"]["name"]
                name = i["author"]["name"]
                # (标题) title - i["title"]
                title = i["title"]
                # (内容) content - i["content"]
                content = ''
                contentTrans = ''
                for c in i["content"]:
                    if c["@type"] == "text":
                        content = c["#text"]
                # (评分) rating - i["im:rating"]
                rating = i["im:rating"]
                # (版本) im:version - i["im:version"]
                version = i["im:version"]
                payload = {
                    'review': {
                        "id": int(id),
                        "author": name,
                        "title": title,
                        "titleTrans": translator.translate(title),
                        "contentTrans": translator.translate(content),
                        "content": content,
                        "star": int(rating),
                        "time": updated,
                        "appId": appid,
                        "appName": appname,
                        "appVersion": version,
                        "language": zone
                    }
                }
                payload = json.dumps(payload)
                print(payload)
                # TODO
            page = page + 1
        else:
            break
    if count == 0:
        print("未获取到任何数据。")
    else:
        print(str(count) + "条数据")
コード例 #12
0
# coding=utf-8
# @Time    : 2019/8/13 14:37
# @Author  : zwa

from GoogleFreeTrans import Translator

translator = Translator.translator(src='en', dest='zh-CN')

print(
    translator.translate(
        '<p style="box-sizing: border-box; margin: 0px 0px 26px; border: 0px; font-family: Roboto, Arial, sans-serif; caret-color: #333333; color: #333333; -webkit-tap-highlight-color: rgba(0, 0, 0, 0); -webkit-text-size-adjust: 100%;"><strong style="box-sizing: border-box; border: 0px;">Location:  La Paz</strong></p><p style="box-sizing: border-box; margin: 0px 0px 26px; border: 0px; font-family: Roboto, Arial, sans-serif; caret-color: #333333; color: #333333; -webkit-tap-highlight-color: rgba(0, 0, 0, 0); -webkit-text-size-adjust: 100%;"><strong style="box-sizing: border-box; border: 0px;"><span style="box-sizing: border-box; border: 0px;">Event:</span></strong><span style="box-sizing: border-box; border: 0px;">  </span>La Paz transportation unions announced a city-wide strike and protest starting Monday, July 15, at 6 a.m. which could result in road blockades, transportation disruptions, and demonstrations. These activities could affect the availability of public transportation in the city of La Paz and connections with other cities and on major roads in Bolivia. The Embassy is expected to be open for normal operations, however, applicants for consular services that are unable to reach the Embassy due to the strike activity may contact the Embassy and will have their appointments rescheduled for another day.</p><p style="box-sizing: border-box; margin: 0px 0px 26px; border: 0px; font-family: Roboto, Arial, sans-serif; caret-color: #333333; color: #333333; -webkit-tap-highlight-color: rgba(0, 0, 0, 0); -webkit-text-size-adjust: 100%;"><strong style="box-sizing: border-box; border: 0px;">Actions to Take:</strong></p><ul style="box-sizing: border-box; margin: 0px 0px 23px; border: 0px; font-family: Roboto, Arial, sans-serif; display: inline-block; caret-color: #333333; color: #333333; -webkit-tap-highlight-color: rgba(0, 0, 0, 0); -webkit-text-size-adjust: 100%;"><li style="box-sizing: border-box; border: 0px;">Monitor the ABC website for official reports of traffic disruptions at <a href="http://transitabilidad.abc.gob.bo/mapa/" target="_blank" rel="noopener noreferrer" shape="rect" style="box-sizing: border-box; color: #5d759b; text-decoration: none; border: 0px; transition: all 0.5s ease;">http://transitabilidad.abc.gob.bo/mapa/</a>.</li><li style="box-sizing: border-box; border: 0px;">Avoid roadblocks and exercise caution if in the vicinity of any large gatherings or protests.</li><li style="box-sizing: border-box; border: 0px;">Do not attempt to pass through roadblocks forcibly.</li><li style="box-sizing: border-box; border: 0px;">Plan for alternate travel routes or remain in place if planned travel is inhibited.</li><li style="box-sizing: border-box; border: 0px;">Monitor local media for updates on road conditions.</li></ul><p style="box-sizing: border-box; margin: 0px 0px 26px; border: 0px; font-family: Roboto, Arial, sans-serif; caret-color: #333333; color: #333333; -webkit-tap-highlight-color: rgba(0, 0, 0, 0); -webkit-text-size-adjust: 100%;"><strong style="box-sizing: border-box; border: 0px;"><span style="box-sizing: border-box; border: 0px;">Assistance:</span></strong></p><p style="box-sizing: border-box; margin: 0px 0px 26px; border: 0px; font-family: Roboto, Arial, sans-serif; caret-color: #333333; color: #333333; -webkit-tap-highlight-color: rgba(0, 0, 0, 0); -webkit-text-size-adjust: 100%;"><a href="https://ec.usembassy.gov/u-s-citizen-services/" target="_blank" rel="noopener noreferrer" shape="rect" style="box-sizing: border-box; color: #5d759b; text-decoration: none; border-width: 0px 0px 1px; border-bottom-style: dotted; border-bottom-color: #003875; transition: all 0.5s ease;"><span style="box-sizing: border-box; border: 0px;">U.S. Embassy La Paz, Bolivia</span></a></p><p style="box-sizing: border-box; margin: 0px 0px 26px; border: 0px; font-family: Roboto, Arial, sans-serif; caret-color: #333333; color: #333333; -webkit-tap-highlight-color: rgba(0, 0, 0, 0'
    ))

tran1 = Translator.translator(src='tr', dest='zh-CN')

print(tran1.translate('Focus Antitrust'))
コード例 #13
0
from GoogleFreeTrans import Translator
translator = Translator.translator()
# print(translator.translate(
#     'A Generative Approach to Zero-Shot and Few-Shot Action Recognition'))

import os
import sys
path0 = r"C:\Users\think\Desktop\零样本学习"
path1 = r"C:\Users\think\Desktop\零样本学习"+'\\'

sys.path.append(path1)
print(sys.path)

# 列出当前目录下所有的文件
files = os.listdir(path0)

# files = os.listdir('.')

print('files', files)

for filename in files:
    portion = os.path.splitext(filename)
    print(portion[0])
    # 如果后缀是.txt
    if portion[1] == ".pdf":
        # 重新组合文件名和后缀名
        temp=translator.translate(portion[0])
        newname = temp + ".pdf"
        filenamedir = path1 + filename
        newnamedir = path1+newname