Python language Examples

Programming Language: Python

Namespace/Package Name: train

Method/Function: language

Examples at hotexamples.com: 6

Python language - 6 examples found. These are the top-rated real-world Python examples of train.language, extracted from open source projects. You can rate the examples to help us improve their quality.

Example #1

Show file

File: langid.py Project: viswavi/languageid

def index(text):
    """Classify ``text`` and return the outcome as a "(<label>,<value>)" string.

    A KenLM model is loaded from ``lm/<code>.binary`` for every code in
    ``train.corp``. The lower-cased text and the models are passed to
    ``train.language``; the first element of its result is translated
    through ``dict(train.valid)`` and the second element is stringified.

    NOTE(review): the models are loaded again on every call -- presumably
    costly; confirm whether they should be cached at module level.
    """
    langs = dict(train.valid)
    # Build a real list instead of a lazy ``map`` object: under Python 3 a
    # map iterator can be consumed only once and supports neither len()
    # nor indexing, which would break any callee expecting a sequence.
    models = [kenlm.LanguageModel('lm/' + code + ".binary")
              for code in train.corp]
    results = train.language(models, text.lower())
    return "(" + langs[results[0]] + "," + str(results[1]) + ")"

Example #2

Show file

def index(text):
    """Run language identification on ``text`` and format the result.

    Loads one ``kenlm.LanguageModel`` per entry of ``train.corp`` (from
    ``lm/<code>.binary``), lower-cases the input and calls
    ``train.language(models, text)``. Element 0 of the result is used as a
    key into ``dict(train.valid)``; element 1 is converted with ``str``.

    Returns:
        The string "(" + label + "," + value + ")" (no space after the comma).
    """
    code_to_label = dict(train.valid)
    # A list comprehension replaces ``map`` so the models form a reusable
    # sequence on Python 3 as well (``map`` there yields a one-shot iterator).
    models = [
        kenlm.LanguageModel('lm/' + code + ".binary") for code in train.corp
    ]
    results = train.language(models, text.lower())
    label = code_to_label[results[0]]
    return "(" + label + "," + str(results[1]) + ")"

Example #3

Show file

File: langid.py Project: viswavi/languageid

def test():
    """Count right and wrong ``train.language`` predictions per test corpus.

    For every name ``c`` in ``corp`` the file ``testcorpus/<c>`` is read as
    UTF-8 and split on whitespace. 1000 distinct start positions are drawn,
    and at each one a run of 1 to 24 consecutive tokens is joined with
    spaces and classified with the module-level ``models``. A prediction is
    counted as right when element 0 of the result equals ``c``.

    Returns:
        dict mapping each corpus name to a ``(right, wrong)`` tuple.

    Raises:
        ValueError: from ``random.sample`` when a corpus has fewer than
            1024 tokens (fewer than 1000 candidate start positions).
    """
    counts = {}
    for c in corp:
        right = 0
        wrong = 0
        # Use a context manager so the corpus file is closed promptly
        # instead of relying on garbage collection.
        with io.open('testcorpus/' + c, encoding='utf-8') as corpus_file:
            text = corpus_file.read()
        # NOTE: tokenizing by whitespace is inappropriate for logographic
        # scripts such as Chinese, but it is what this test does.
        text = text.split()
        # Start positions stop 24 tokens before the end, so a run of up to
        # 24 tokens never reaches past the last token.
        for i in random.sample(range(1, len(text) - 23), 1000):
            randogram = text[i:i + random.randint(1, 24)]
            ans = train.language(models, ' '.join(randogram))[0]
            if ans != c:
                wrong += 1
            else:
                right += 1
        # Record the totals once per corpus rather than on every sample.
        counts[c] = (right, wrong)
    return counts

Example #4

Show file

def test():
    """Evaluate ``train.language`` on random token runs from each corpus.

    Each corpus ``c`` in ``corp`` is read from ``testcorpus/<c>`` (UTF-8)
    and split on whitespace. For 1000 randomly sampled start indices, a
    window of between 1 and 24 consecutive tokens is joined with single
    spaces and passed to ``train.language`` together with ``models``; the
    first element of the result is compared with ``c``.

    Returns:
        dict: ``{corpus_name: (right, wrong)}``.

    Raises:
        ValueError: raised by ``random.sample`` if a corpus does not offer
            at least 1000 start indices (i.e. has fewer than 1024 tokens).
    """
    counts = {}
    for c in corp:
        # The ``with`` block closes the file handle that the previous
        # ``io.open(...).read()`` one-liner left open.
        with io.open('testcorpus/' + c, encoding='utf-8') as handle:
            tokens = handle.read().split()
        # NOTE: splitting on spaces is not an appropriate tokenization for
        # logographic scripts such as Chinese; kept as the test's behavior.
        right = 0
        wrong = 0
        for start in random.sample(range(1, len(tokens) - 23), 1000):
            # Window length is drawn after the start indices, one per sample.
            length = random.randint(1, 24)
            randogram = tokens[start:start + length]
            ans = train.language(models, ' '.join(randogram))[0]
            if ans == c:
                right += 1
            else:
                wrong += 1
        # Totals are stored once the corpus has been fully sampled.
        counts[c] = (right, wrong)
    return counts

Example #5

Show file

File: application.py Project: viswavi/languageid

def hello(text):
    """Classify ``text`` with ``train.language`` and format the outcome.

    Calls ``train.language(train.models, text)`` and returns the first two
    elements of its result as the string "(<first>, <second>)"; the second
    element is passed through ``str``.
    """
    # Debug aid kept from the original: return str(train.models[0].order)
    prediction = train.language(train.models, text)
    label = prediction[0]
    value = str(prediction[1])
    return "(" + label + ", " + value + ")"

Example #6

Show file

File: application.py Project: viswavi/languageid

def hello(text):
    """Return the ``train.language`` result for ``text`` as "(a, b)".

    ``a`` is element 0 of the result, concatenated as-is; ``b`` is element 1
    converted with ``str``. The shared ``train.models`` are used.
    """
    # Debugging alternative from the original: str(train.models[0].order)
    outcome = train.language(train.models, text)
    pieces = ("(", outcome[0], ", ", str(outcome[1]), ")")
    formatted = pieces[0]
    for piece in pieces[1:]:
        formatted = formatted + piece
    return formatted