#!/usr/bin/python
#-*-coding:utf-8-*-
#2015/05/27 16:54:01 Shin Kanouchi

import argparse
import knock030


def main(doc):
    for sent in doc:
        nouns = list()
        for m in sent:
            if m['pos'] == '名詞':
                nouns.append(m['surface'])
            elif nouns:
                print ' '.join(nouns)
                nouns = list()

if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    parser.add_argument('-t', '--train', dest='train', default='../data/neko.mecab', help='input training data')
    args = parser.parse_args()
    my_morphs = knock030.get_morphs(args.train)
    main(my_morphs)
#!/usr/bin/python
#-*-coding:utf-8-*-
#2015/05/27 16:44:17 Shin Kanouchi

import argparse
import knock030


def main(doc):
    for sent in doc:
        for m in sent:
            if m['pos'] == '名詞' and m['pos1'] == 'サ変接続':
                print(m['base'])


if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    parser.add_argument('-t',
                        '--train',
                        dest='train',
                        default='../data/neko.txt.mecab',
                        help='input training data')
    args = parser.parse_args()
    my_morphs = knock030.get_morphs(args.train)
    main(my_morphs)
Example #3
0
# coding:utf-8
'''
python knock032.py ../Data/neko.txt.mecab
'''

import sys
import knock030 as marujirou

doc = marujirou.get_morphs(sys.argv[1])

for sent in doc:
    for m in sent:
        if m['pos'] == '動詞':
            print m['base']