def freq(path):
    """Count how often each ``'base'`` value occurs in the parsed input.

    ``path`` is handed unchanged to ``nlp030.mecab``. The result of that
    call is iterated as sentences, and each sentence as items that are
    subscripted with ``'base'``.
    NOTE(review): presumably these are MeCab morpheme dicts and ``'base'``
    is the dictionary (base) form -- confirm against ``nlp030``.

    Returns:
        A dict mapping each ``'base'`` value to its occurrence count.
    """
    counts = {}
    for sentence in nlp030.mecab(path):
        for morpheme in sentence:
            base = morpheme['base']
            # First sighting starts from 0, then every sighting adds one.
            counts[base] = counts.get(base, 0) + 1
    return counts
def main(path):
    """Print every "A の B" phrase where both A and B are nouns.

    ``path`` is handed unchanged to ``nlp030.mecab``. Each sentence of the
    result is scanned for a token whose ``'surface'`` is ``'の'`` and whose
    immediate neighbours both have ``'pos'`` equal to ``'名詞'``. For each
    match the two neighbouring surfaces are printed joined by ``'の'``.
    NOTE(review): assumes each sentence supports ``len()`` and integer
    indexing (e.g. a list of morpheme dicts) -- confirm against ``nlp030``.

    Returns:
        None. Matches are written to standard output, one per line.
    """
    for sentence in nlp030.mecab(path):
        # Visit interior positions only. A 'の' at index 0 has no left
        # neighbour, and ``sentence[-1]`` would silently wrap around to the
        # last token instead of raising IndexError. A 'の' at the last index
        # has no right neighbour. Restricting the range covers both ends,
        # so no IndexError handling is needed.
        for i in range(1, len(sentence) - 1):
            if sentence[i]['surface'] != 'の':
                continue
            before = sentence[i - 1]
            after = sentence[i + 1]
            if before['pos'] == '名詞' and after['pos'] == '名詞':
                print(before['surface'] + 'の' + after['surface'])
def main(path):
    """Print the ``'base'`` of every noun tagged ``'サ変接続'``.

    ``path`` is handed unchanged to ``nlp030.mecab``. Every item of every
    sentence in the result is checked. Items whose ``'pos'`` is ``'名詞'``
    and whose ``'pos1'`` is ``'サ変接続'`` have their ``'base'`` value
    printed.
    NOTE(review): presumably the items are MeCab morpheme dicts -- confirm
    against ``nlp030``.

    Returns:
        None. Matches are written to standard output, one per line.
    """
    for sentence in nlp030.mecab(path):
        for morpheme in sentence:
            # 'pos1' is only consulted once 'pos' has matched.
            if morpheme['pos'] != '名詞':
                continue
            if morpheme['pos1'] != 'サ変接続':
                continue
            print(morpheme['base'])
def main(path):
    """Print the ``'surface'`` of every item whose ``'pos'`` is ``'動詞'``.

    ``path`` is handed unchanged to ``nlp030.mecab``. Every item of every
    sentence in the result is checked in order.
    NOTE(review): presumably the items are MeCab morpheme dicts and
    ``'surface'`` is the token as written in the text -- confirm against
    ``nlp030``.

    Returns:
        None. Matches are written to standard output, one per line.
    """
    for sentence in nlp030.mecab(path):
        for morpheme in sentence:
            if morpheme['pos'] != '動詞':
                continue
            print(morpheme['surface'])