Beispiel #1
0
#! -*- coding: utf-8 -*-
import subprocess
from subprocess import Popen, PIPE, STDOUT
import multiprocessing
# socket object
import socket
# logger
from JapaneseTokenizer import init_logger
import logging
logger = init_logger.init_logger(logging.getLogger(init_logger.LOGGER_NAME))
# else
from six import text_type
import six
import pexpect
import shutil
import signal
import os
'''
class BaseServerHandler(object):
    """Base handler to use UNIX process as server process"""
    def __init__(self):
        # メンバ変数を定義しておく
        self._sock = None  # type: socket
        self._address = None  # type: str

    def __call__(self, serversocket):
        """"""
        # type: (socket)->None
        while True:
            # 接続を受ける
            (self._sock, self._address) = serversocket.accept()
# -*- coding: utf-8 -*-
from JapaneseTokenizer.common import text_preprocess
from JapaneseTokenizer.datamodels import FilteredObject, TokenizedResult, TokenizedSenetence
from JapaneseTokenizer.common import filter
from JapaneseTokenizer import init_logger
import logging
import sys

# Module-wide logger: the logger named init_logger.LOGGER_NAME, passed through
# the project's init_logger.init_logger helper.
logger = init_logger.init_logger(logging.getLogger(init_logger.LOGGER_NAME))
# sys.version_info of the running interpreter.
python_version = sys.version_info

# Mykytea is imported on a best-effort basis: when the package is missing the
# failure is only logged, so importing this module still succeeds. In that
# case the name ``Mykytea`` stays undefined, and KyteaWrapper.__init__ (which
# calls Mykytea.Mykytea) will fail with NameError when it is invoked.
try:
    import Mykytea
except ImportError:
    logger.error(msg="Mykytea is not ready to use yet. Install first")

__author__ = "kensuke-mi"


class KyteaWrapper:
    def __init__(self, option_string=""):
        assert isinstance(option_string, (str, str))
        # option string is argument of Kytea.
        self.kytea = Mykytea.Mykytea(option_string)

    def __list_tags(self, t):
        def convert(t2):
            return (t2[0], t2[1])

        return [(word.surface, [[convert(t2) for t2 in t1] for t1 in word.tag]) for word in t]