Пример #1
0
    def __init__(self,
                 jvmpath=None,
                 userdic=None,
                 modelpath=None,
                 max_heap_size=1024):
        """Set up the Java-side Komoran analyzer and load its tagset.

        :param jvmpath: Forwarded to ``jvm.init_jvm`` when no JVM is running.
        :param userdic: If truthy, passed to the analyzer's ``setUserDic``.
        :param modelpath: Model directory handed to the Java ``Komoran``
            constructor; when falsy, ``<installpath>/java/data/models`` is used.
        :param max_heap_size: Forwarded to ``jvm.init_jvm`` (presumably the
            JVM heap limit -- confirm against ``jvm.init_jvm``).
        :raises IOError: If constructing the Java analyzer raises ``TypeError``.
        """
        # Only boot a JVM when the process does not have one yet.
        jvm_running = jpype.isJVMStarted()
        if not jvm_running:
            jvm.init_jvm(jvmpath, max_heap_size)

        # FIXME: Cannot execute without sudoing
        # java.lang.NoClassDefFoundErrorPyRaisable: java.lang.NoClassDefFoundError: kr/co/shineware/nlp/komoran/core/analyzer/Komoran
        self.modelpath = modelpath if modelpath else os.path.join(
            utils.installpath, 'java', 'data', 'models')

        tagset_file = '%s/data/tagset/komoran.json' % utils.installpath
        self.tagset = utils.read_json(tagset_file)

        core_pkg = jpype.JPackage('kr.co.shineware.nlp.komoran.core')
        try:
            self.jki = core_pkg.Komoran(self.modelpath)
        except TypeError:
            # Per the original note, the TypeError seen here reads
            # "Package ... is not Callable"; it is surfaced as an IOError.
            raise IOError(
                "Cannot access komoran-dic. Please leave an issue at https://github.com/konlpy/konlpy/issues"
            )

        # A user dictionary is optional; register it only when supplied.
        if userdic:
            self.jki.setUserDic(userdic)
Пример #2
0
    def __init__(self, jvmpath=None, max_heap_size=1024):
        """Create the Java ``OktInterface`` instance and load the tagset.

        :param jvmpath: Forwarded to ``jvm.init_jvm`` when no JVM is running.
        :param max_heap_size: Forwarded to ``jvm.init_jvm`` alongside
            ``jvmpath``.
        """
        # Start a JVM only if this process has not started one already.
        jvm_running = jpype.isJVMStarted()
        if not jvm_running:
            jvm.init_jvm(jvmpath, max_heap_size)

        # Resolve the Java class through its package and instantiate it.
        self.jki = jpype.JPackage('kr.lucypark.okt').OktInterface()

        tagset_file = '%s/data/tagset/twitter.json' % utils.installpath
        self.tagset = utils.read_json(tagset_file)
Пример #3
0
    def __init__(self, jvmpath=None):
        """Create the Java ``TktInterface`` instance and load the tagset.

        :param jvmpath: Forwarded to ``jvm.init_jvm`` when no JVM is running.
        """
        # Start a JVM only if this process has not started one already.
        jvm_running = jpype.isJVMStarted()
        if not jvm_running:
            jvm.init_jvm(jvmpath)

        tkt_pkg = jpype.JPackage('kr.lucypark.tkt')
        self.jki = tkt_pkg.TktInterface()

        tagset_file = '%s/data/tagset/twitter.json' % utils.installpath
        self.tagset = utils.read_json(tagset_file)
Пример #4
0
    def __init__(self, jvmpath=None, max_heap_size=1024):
        """Create the Java ``HannanumInterface`` instance and load the tagset.

        :param jvmpath: Forwarded to ``jvm.init_jvm`` when no JVM is running.
        :param max_heap_size: Forwarded to ``jvm.init_jvm`` alongside
            ``jvmpath``.
        """
        # Start a JVM only if this process has not started one already.
        if not jpype.isJVMStarted():
            jvm.init_jvm(jvmpath, max_heap_size)

        # self.jhi holds the Java-side interface object.
        hannanum_pkg = jpype.JPackage('kr.lucypark.jhannanum.comm')
        self.jhi = hannanum_pkg.HannanumInterface()

        tagset_file = '%s/data/tagset/hannanum.json' % utils.installpath
        self.tagset = utils.read_json(tagset_file)
Пример #5
0
    def __init__(self, jvmpath=None, max_heap_size=1024):
        """Create the Java ``KkmaInterface`` instance and load the tagset.

        :param jvmpath: Forwarded to ``jvm.init_jvm`` when no JVM is running.
        :param max_heap_size: Forwarded to ``jvm.init_jvm`` alongside
            ``jvmpath``.
        """
        # Start a JVM only if this process has not started one already.
        jvm_running = jpype.isJVMStarted()
        if not jvm_running:
            jvm.init_jvm(jvmpath, max_heap_size)

        # self.jki holds the Java-side interface object.
        self.jki = jpype.JPackage('kr.lucypark.kkma').KkmaInterface()

        tagset_file = '%s/data/tagset/kkma.json' % utils.installpath
        self.tagset = utils.read_json(tagset_file)
Пример #6
0
    def __init__(self, jvmpath=None):
        """Create the Java ``KkmaInterface`` instance and load the tagset.

        :param jvmpath: Forwarded to ``jvm.init_jvm`` when no JVM is running.
        """
        # Start a JVM only if this process has not started one already.
        if not jpype.isJVMStarted():
            jvm.init_jvm(jvmpath)

        # self.jki holds the Java-side interface object.
        kkma_pkg = jpype.JPackage('kr.lucypark.kkma')
        interface_cls = kkma_pkg.KkmaInterface
        self.jki = interface_cls()

        tagset_file = '%s/data/tagset/kkma.json' % utils.installpath
        self.tagset = utils.read_json(tagset_file)
Пример #7
0
        def __init__(self, dictionary_directory='C:/Apps/DISA3/resources/', max_heap_size=1024):
            """Start the JVM if needed and initialise the Java ``DISA`` engine.

            :param dictionary_directory: Base directory that contains the
                ``jiana``, ``plot`` and ``disa`` dictionary trees. A trailing
                path separator is optional.
            :param max_heap_size: Forwarded to ``jvm.init_jvm`` when no JVM is
                running.
            """
            # Function-scope import: this snippet's module imports are not
            # visible here, so the dependency is kept local to the method.
            import os

            jvmpath = jpype.getDefaultJVMPath()

            # Existing diagnostic output: reports whether a JVM was already up.
            print(jpype.isJVMStarted())
            if not jpype.isJVMStarted():
                jvm.init_jvm(jvmpath, max_heap_size)

            # os.path.join instead of "+" so that a base directory passed
            # without a trailing slash still yields well-formed paths.
            jianaDicPath = os.path.join(dictionary_directory, "jiana/dic/korean/dcd")
            plotDicPath = os.path.join(dictionary_directory, "plot/dic/korean/dcd")
            disaDicPath = os.path.join(dictionary_directory, "disa/dic/korean/dcd")
            category = "SUBWAY_STATION"

            # Step 1: DISA init
            disaPackage = jpype.JPackage('com.diquest.disa')
            self.jDisa = disaPackage.DISA()
            self.jDisa.init(disaDicPath, plotDicPath, jianaDicPath, category)
    print_out_srs(srs)
    #makeDic_w2v(srs)
    tokenized_srs, tokenized_usecase = makeDic(srs)
    print(tokenized_usecase)
    final_srs = srs_analysis(tokenized_srs)
    #print(final_srs)
    # for reqId in list(final_srs.keys()):
    #     print('-----',reqId,'-----')
    #     try :
    #         o_ds_list = final_srs.get(reqId)
    #         for o_ds in o_ds_list:
    #             print('  [',o_ds.ilvl,']',end=' ')
    #             for w in o_ds.words:
    #                 print(w,end=' ')
    #             print(' ',o_ds.template)
    #     except:
    #         pass
    c_row = srs_out(final_srs,doc_name)
    usecase_out(tokenized_usecase,doc_name,current_row=c_row)

if __name__ == "__main__":
    # Start the JVM before the document is loaded and parsed.
    jvm.init_jvm()

    # Document base name (without ".docx"): first CLI argument if given,
    # otherwise the bundled default sample.
    doc_name = sys.argv[1] if len(sys.argv) > 1 else '표적관리_SRS_full'

    doc = docx.Document(doc_name + '.docx')
    srs_parsing(doc, doc_name)

Пример #9
0
import logging

from konlpy import jvm
from konlpy.tag import Twitter

logger = logging.getLogger(__name__)


def main():
    """
        konlpy 사용시 주의 사항
        자바 설치 및 세팅 필요
        JAVA_HOME 세팅이 필요합니다.
        export JAVA_HOME=$(/usr/libexec/java_home)
    """
    konl = Twitter()
    file_path = '/Users/bongster/Downloads/20160528_jiana.csv'
    with open(file_path, 'rb') as csv_file:
        inforeader = csv.reader(csv_file)
        for row in inforeader:
            r = konl.pos(unicode(row[4], 'utf-8'), norm=True, stem=True)
            print '=' * 20
            for txt, post in r:
                print txt, post
            print '=' * 20


if __name__ == '__main__':
    # Script entry point: start the JVM first, then run main().
    jvm.init_jvm()
    main()
    def __init__(self, jvm_path=None, max_heap_size=1024):
        """Create the Java ``OpenKoreanTextProcessorJava`` instance.

        :param jvm_path: Forwarded to ``jvm.init_jvm`` when no JVM is running.
        :param max_heap_size: Forwarded to ``jvm.init_jvm`` alongside
            ``jvm_path``.
        """
        # Start a JVM only if this process has not started one already.
        jvm_running = jpype.isJVMStarted()
        if not jvm_running:
            jvm.init_jvm(jvm_path, max_heap_size)

        # Resolve the processor class through its Java package, then build it.
        processor_cls = jpype.JPackage(
            'org.openkoreantext.processor').OpenKoreanTextProcessorJava
        self.processor = processor_cls()