示例#1
0
文件: lsa_test.py 项目: zxsted/finch
from lsa import LSA

if __name__ == '__main__':
    # Script entry point: load the documents and stop words from disk,
    # then fit an LSA model on the documents and plot it.

    # One document per line, trailing whitespace/newline stripped.
    # The context manager closes the file as soon as the list is built
    # rather than leaving the handle open until garbage collection.
    with open('temp/all_book_titles.txt') as titles_file:
        documents = [line.rstrip() for line in titles_file]

    # Stop words read from disk, one per line.
    with open('temp/stopwords.txt') as stopwords_file:
        stopwords = {line.rstrip() for line in stopwords_file}

    # Extra stop words added on top of the file's list (presumably terms
    # too common in the titles to be informative -- confirm with the
    # LSA implementation's tokenizer).
    stopwords |= {
        'introduction', 'edition', 'series', 'application',
        'approach', 'card', 'access', 'package', 'plus',
        'etext', 'brief', 'vol', 'fundamental', 'guide',
        'essential', 'printed', 'third', 'second', 'fourth',
    }

    model = LSA(stopwords)
    model.fit(documents)
    model.plot()