コード例 #1
0
ファイル: cca.py プロジェクト: karlstratos/cca
def main(args):
    """Run the pipeline stages selected by the parsed options in ``args``.

    The stages run in this order, each only when its option is truthy:

    1. ``args.corpus``: count unigrams, decide the vocabulary, then either
       rewrite the corpus (``args.rewrite``) or extract statistics from it.
    2. ``args.stat``: run CCA on the statistics, either through the
       ``canon`` class (``args.no_matlab``) or through ``call_matlab``.
    3. ``args.clean``: call ``clean()``.

    Args:
        args: Object exposing the attributes ``quiet``, ``corpus``,
            ``cutoff``, ``vocab``, ``want``, ``rewrite``, ``window``,
            ``stat``, ``m``, ``kappa``, ``no_matlab`` and ``clean``
            (presumably an ``argparse.Namespace`` -- confirm at call site).

    Raises:
        AssertionError: If ``args.stat`` is set while ``args.m`` or
            ``args.kappa`` is ``None`` (only when asserts are enabled).
    """
    set_quiet(args.quiet)

    # Stage 1: corpus preprocessing.
    if args.corpus:
        unigram_counts = count_unigrams(args.corpus)
        vocab, outfname = decide_vocab(
            unigram_counts, args.cutoff, args.vocab, args.want
        )
        if not args.rewrite:
            extract_stat(args.corpus, vocab, outfname, args.window)
        else:
            rewrite_corpus(args.corpus, vocab, outfname)

    # Stage 2: CCA on previously extracted statistics.
    if args.stat:
        # Both parameters are required by either backend.
        assert args.m is not None
        assert args.kappa is not None
        if not args.no_matlab:
            call_matlab(args.stat, args.m, args.kappa)
        else:
            solver = canon()
            solver.set_params(args.m, args.kappa)
            solver.get_stat(args.stat)
            solver.start_logging()
            solver.approx_cca()
            solver.end_logging()
            solver.write_result()

    # Stage 3: optional cleanup.
    if args.clean:
        clean()
コード例 #2
0
def main(args):
    """Dispatch to the corpus, CCA and cleanup steps requested in ``args``.

    Each step is independent and runs only if its option is truthy:
    ``args.corpus`` triggers unigram counting and vocabulary selection
    followed by either a corpus rewrite or statistics extraction;
    ``args.stat`` triggers CCA through ``canon`` or ``call_matlab``;
    ``args.clean`` triggers ``clean()``.

    Args:
        args: Object exposing ``quiet``, ``corpus``, ``cutoff``, ``vocab``,
            ``want``, ``rewrite``, ``window``, ``stat``, ``m``, ``kappa``,
            ``no_matlab`` and ``clean`` (presumably an
            ``argparse.Namespace`` -- confirm at call site).

    Raises:
        AssertionError: If ``args.stat`` is set while ``args.m`` or
            ``args.kappa`` is ``None`` (only when asserts are enabled).
    """
    set_quiet(args.quiet)

    if args.corpus:
        counts = count_unigrams(args.corpus)
        vocab, outfname = decide_vocab(
            counts,
            args.cutoff,
            args.vocab,
            args.want,
        )
        if not args.rewrite:
            extract_stat(args.corpus, vocab, outfname, args.window)
        else:
            rewrite_corpus(args.corpus, vocab, outfname)

    if args.stat:
        # m and kappa are needed by both the Python and the Matlab path.
        assert args.m is not None
        assert args.kappa is not None
        if not args.no_matlab:
            call_matlab(args.stat, args.m, args.kappa)
        else:
            cca = canon()
            cca.set_params(args.m, args.kappa)
            cca.get_stat(args.stat)
            cca.start_logging()
            cca.approx_cca()
            cca.end_logging()
            cca.write_result()

    if args.clean:
        clean()
コード例 #3
0
import os
import sys
from src.call_matlab import call_matlab
from src.canon import canon
from src.io import clean
from src.io import set_quiet
from src.strop import count_unigrams
from src.strop import decide_vocab
from src.strop import extract_stat

# Names read by check() below. At ordinary module scope this `global`
# statement has no effect; it mainly documents which module-level names
# check() depends on. Only `corpus` is assigned in this section; the others
# are presumably assigned further down -- confirm before calling check().
global corpus, cutoff, window, gold_Xcount, gold_Ycount, gold_XYcount
# Runs at import time (presumably suppresses progress output -- confirm in
# src.io).
set_quiet(True)

# Presumably the sentences contained in the example corpus below:
# the dog saw the cat
# the dog barked
# the cat meowed
corpus = 'input/example/example.corpus'


# Check the counts in the above global variables.
def check():
    """Recompute the counts for ``corpus`` and compare them to the gold ones.

    Reads the module-level globals ``corpus``, ``cutoff``, ``window``,
    ``gold_Xcount``, ``gold_Ycount`` and ``gold_XYcount``; all of them must
    be assigned before this function is called.

    Only keys present in the computed counts are compared, so a key that
    exists solely in a gold count is not detected here.

    Returns:
        The fourth value (``stat``) returned by ``extract_stat``, so callers
        can inspect it further. Previously this value was computed and then
        discarded.

    Raises:
        AssertionError: If a computed count differs from its gold value
            (only when asserts are enabled).
    """
    unigrams = count_unigrams(corpus)
    vocab, outfname = decide_vocab(unigrams, cutoff, None, None)
    XYcount, Xcount, Ycount, stat = extract_stat(corpus, vocab, outfname,
                                                 window)
    for x in Xcount:
        assert Xcount[x] == gold_Xcount[x]
    for y in Ycount:
        assert Ycount[y] == gold_Ycount[y]
    # Keys of XYcount are (x, y) pairs.
    for x, y in XYcount:
        assert XYcount[x, y] == gold_XYcount[x, y]
    return stat
コード例 #4
0
ファイル: debug.py プロジェクト: karlstratos/cca
import os
import sys
from src.call_matlab import call_matlab
from src.canon import canon
from src.io import clean
from src.io import set_quiet
from src.strop import count_unigrams
from src.strop import decide_vocab
from src.strop import extract_stat

# Names read by check() below. At ordinary module scope this `global`
# statement has no effect; it mainly documents which module-level names
# check() depends on. Only `corpus` is assigned in this section; the others
# must be assigned before check() is called.
global corpus, cutoff, window, gold_Xcount, gold_Ycount, gold_XYcount
# Runs at import time (presumably suppresses progress output -- confirm in
# src.io).
set_quiet(True)

# Presumably the sentences contained in the example corpus below:
# the dog saw the cat
# the dog barked
# the cat meowed
corpus = 'input/example/example.corpus'

# Check the counts in the above global variables.
def check():
    """Recompute the counts for ``corpus`` and compare them to the gold ones.

    Reads the module-level globals ``corpus``, ``cutoff``, ``window``,
    ``gold_Xcount``, ``gold_Ycount`` and ``gold_XYcount``; all of them must
    be assigned before this function is called.

    Only keys present in the computed counts are compared, so a key that
    exists solely in a gold count is not detected here.

    Returns:
        The fourth value (``stat``) returned by ``extract_stat``.

    Raises:
        AssertionError: If a computed count differs from its gold value
            (only when asserts are enabled).
    """
    unigram_counts = count_unigrams(corpus)
    vocab, outfname = decide_vocab(unigram_counts, cutoff, None, None)
    pair_counts, left_counts, right_counts, stat = extract_stat(
        corpus, vocab, outfname, window
    )

    for left in left_counts:
        assert left_counts[left] == gold_Xcount[left]

    for right in right_counts:
        assert right_counts[right] == gold_Ycount[right]

    # Keys of the joint count are (x, y) pairs.
    for left, right in pair_counts:
        assert pair_counts[left, right] == gold_XYcount[left, right]

    return stat

# Case 1: cutoff = 0, window = 2
cutoff = 0