Python DbUtil.compute_meanings 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: asian_word_analyzer.korean.db

클래스/타입: DbUtil

메소드/함수: compute_meanings

hotexamples.com에서의 예제들: 4

Python DbUtil.compute_meanings - 4개의 예제를 찾았습니다. 오픈소스 프로젝트에서 추출한 Python asian_word_analyzer.korean.db.DbUtil.compute_meanings의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제의 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

DbUtil(9)

compute_meanings(2)

get_hanja_meaning(2)

get_hanja_name(2)

get_hanja(1)

예제 #1

파일 보기

파일: test_korean_db.py 프로젝트: jbfiot/AsianWordAnalyzer

def test_compute_meanings():
    """Check that a known English gloss is among the meanings of '안녕'."""
    expected = '(평안) (public) peace (안정) stability, well'
    meanings = DbUtil().compute_meanings(u'안녕')
    assert expected in meanings.values

예제 #2

파일 보기

파일: word.py 프로젝트: jbfiot/AsianWordAnalyzer

class KoreanWord(object):
    """ This class is used to manipulate Korean words.

    A word holds the raw input string, one list of blocks per possible
    meaning, the list of meanings, and the index of the currently selected
    meaning.
    """
    def __init__(self, string='', ethym=None, meaning=None, compute_ethym=False):
        """ Build a word either from explicit data or by analysing `string`.

        Args:
            string: the Korean word, e.g. a user input string.
            ethym: optional hanja representation, one character per
                character of `string`.
            meaning: optional meaning of the word.
            compute_ethym: when the word has to be analysed, whether the
                hanja of each block should be looked up as well.

        When both `ethym` and `meaning` are given they are used as is and no
        suffix detection is performed (the suffix attributes are not set).
        Otherwise the suffix, the blocks and the meanings are computed.
        """
        self.string = _u(string)  # e.g. user input string
        self.language = 'Korean'
        self.db_util = DbUtil()

        if ethym and meaning:
            # To the best of my knowledge a Korean word and its hanja
            # representation (when existing) have the same lengths.
            assert(len(string) == len(ethym))
            self.blocks = [[Block(char, ethym=ethym[i])
                            for i, char in enumerate(string)]]
            self.meanings = [meaning]
            self.selected_meaning = 0 # the word is clearly defined

        else:
            self.compute_suffix()
            self.blocks = self.compute_blocks(compute_ethym)
            # Different meanings in English
            self.meanings = self.db_util.compute_meanings(self.string_without_suffix)
            self.selected_meaning = 0 # index of the selected meaning


    @property
    def meaning(self):
        """ Meaning getter: the currently selected meaning. """
        return self.meanings[self.selected_meaning]

    def get_blocks_for_selected_meaning(self):
        """ Getter for the blocks corresponding to the selected meaning """
        return self.blocks[self.selected_meaning]

    @property
    def ethym(self):
        """ Concatenation of the non-empty block etymologies for the
        selected meaning. """
        return ''.join([block.ethym
                        for block in self.blocks[self.selected_meaning]
                        if block.ethym])

    #==========================================================================
    #  PRINT METHODS
    #==========================================================================

    def print_blocks_for_selected_meaning(self):
        """ Return the list of block strings for the selected meaning.

        Despite its name, this method does not print anything: it returns
        the strings so that the caller can display them.

        Example:
        --------
            For the word '안녕', the returned list will be ['안', '녕']
        """
        return [block.string for block in self.blocks[self.selected_meaning]]


    #==========================================================================
    #   LANGUAGE METHODS
    #==========================================================================

    def compute_suffix(self):
        """ This method computes:
        self.suffix
        self.suffix_meaning
        self.string_without_suffix

        When several known suffixes match the end of the string (e.g. both
        '하세요' and '요' for '안녕하세요'), the longest one is selected, so
        the result does not depend on the dictionary iteration order.
        When no suffix matches, self.suffix is '' and self.suffix_meaning
        is None.
        """
        suffixes = {u'하다':u'하다 verb particule',
                    u'합니다': u'formal 하다 ending',
                    u'하세요': u'formal imperative form of 하다',
                    u'요': u'politeness particle',
                    u'님': u'honorific particle'}
        # TODO: store the suffixes in the database instead of hardcoding them here

        # All matches are suffixes of the same string, so two different
        # matches always have different lengths: the longest is unambiguous.
        matching = [suffix for suffix in suffixes
                    if self.string.endswith(suffix)]
        detected_suffix = max(matching, key=len) if matching else ''

        # Explicit end index: a negative slice would fail for an empty suffix.
        self.string_without_suffix = self.string[0:len(self.string)-len(detected_suffix)]
        self.suffix = detected_suffix
        self.suffix_meaning = suffixes.get(detected_suffix, None)

    def compute_blocks(self, compute_ethym=False):
        """ Compute the blocks given the input string.

        One block is created per non-space character of the string without
        its suffix; a final block describing the suffix is appended when a
        suffix has been detected. compute_suffix() must have been called
        before.

        Output:
            Returns a list of lists of blocks, i.e.
            [ [b11, ..., b1n1], [b21, ..., b2n2], ...], where each list of
            blocks [bi1, ..., bini] corresponds to a possible meaning of the
            input string.

        Note:
            In this implementation, only one meaning is available.
        """
        if DEBUG:
            UI.render_info('compute_blocks(...) called for word ' + self.string)

        stem = self.string_without_suffix

        if not compute_ethym:
            blocks = [Block(char) for char in stem if char != ' ']
        else:
            ethym = get_hanja(stem)
            if DEBUG:
                UI.render_info(ethym)

            # The hanja is indexed with the position in the stem (spaces
            # included), so that characters stay aligned with their hanja.
            blocks = [Block(char, ethym=ethym[i],
                            meaning=self.db_util.get_hanja_meaning(ethym[i]),
                            name=self.db_util.get_hanja_name(ethym[i]))
                      for i, char in enumerate(stem)
                      if char != ' ']

        if self.suffix:
            suffix_desc = 'Suffix: ' + self.suffix_meaning
            blocks.append(Block(self.suffix, meaning=suffix_desc))

        return [blocks]

예제 #3

파일 보기

 def test_compute_meanings(self):
     """Check that a known English gloss is among the meanings of '안녕'."""
     expected = '(평안) (public) peace (안정) stability, well'
     meanings = DbUtil().compute_meanings(u'안녕')
     assert expected in meanings

예제 #4

파일 보기

class KoreanWord(AsianWord):
    """ This class is used to manipulate Korean words.

    A word holds the raw input string, one list of blocks per possible
    meaning, the list of meanings, and the index of the currently selected
    meaning.
    """
    language = 'Korean'

    def __init__(self,
                 string='',
                 etymology=None,
                 meaning=None,
                 compute_etymology=False):
        """ Build a word either from explicit data or by analysing `string`.

        Args:
            string: the Korean word, e.g. a user input string.
            etymology: optional hanja representation, one character per
                character of `string`.
            meaning: optional meaning of the word.
            compute_etymology: when the word has to be analysed, whether
                the hanja of each block should be looked up as well.

        Raises:
            ValueError: if `etymology` is given and its length differs from
                the length of `string`.

        When both `etymology` and `meaning` are given they are used as is
        and no suffix detection is performed. Otherwise the suffix, the
        blocks and the meanings are computed.
        """
        self.check_init_parameters(string, etymology, meaning)
        self.string = _u(string)  # e.g. user input string
        self.db_util = DbUtil()

        if etymology and meaning:
            self.blocks = [[
                Block(char, etymology=etymology[i])
                for i, char in enumerate(string)
            ]]
            self.meanings = [meaning]
            self.selected_meaning = 0  # the word is clearly defined

        else:
            self.compute_suffix()
            self.blocks = self.compute_blocks(compute_etymology)
            self.meanings = self.db_util.compute_meanings(
                self.string_without_suffix)  # Different meanings in English
            self.selected_meaning = 0  # index of the selected meaning

    @staticmethod
    def check_init_parameters(string, etymology, meaning):
        """ Validate the constructor arguments.

        Raises:
            ValueError: if `etymology` is not None and does not have the
                same length as `string`.
        """
        if etymology is not None:
            if len(string) != len(etymology):
                # to the best of my knowledge a Korean word and its hanja
                # representation (when existing) have the same lengths
                raise ValueError(
                    'string and etymology must have the same lengths')

    def compute_suffix(self):
        """ This method computes:
        self.suffix
        self.suffix_meaning
        self.string_without_suffix

        When several known suffixes match the end of the string (e.g. both
        '하세요' and '요' for '안녕하세요'), the longest one is selected, so
        the result does not depend on the dictionary iteration order.
        When no suffix matches, self.suffix is '' and self.suffix_meaning
        is None.
        """
        suffixes = {
            u'하다': u'하다 verb particle',
            u'합니다': u'formal 하다 ending',
            u'하세요': u'formal imperative form of 하다',
            u'요': u'politeness particle',
            u'님': u'honorific particle'
        }
        # TODO: store the suffixes in the database instead of hardcoding them here

        # All matches are suffixes of the same string, so two different
        # matches always have different lengths: the longest is unambiguous.
        matching = [
            suffix for suffix in suffixes if self.string.endswith(suffix)
        ]
        detected_suffix = max(matching, key=len) if matching else ''

        # Explicit end index: a negative slice would fail for an empty suffix.
        self.string_without_suffix = self.string[0:len(self.string) -
                                                 len(detected_suffix)]
        self.suffix = detected_suffix
        self.suffix_meaning = suffixes.get(detected_suffix, None)

    def compute_blocks(self, compute_etymology=False):
        """ Compute the blocks given the input string.

        One block is created per non-space character of the string without
        its suffix; a final block describing the suffix is appended when a
        suffix has been detected. When the etymology is requested but no
        hanja is found, an error is rendered and only the suffix block (if
        any) is returned. compute_suffix() must have been called before.

        Output:
            Returns a list of lists of blocks, i.e.
            [ [b11, ..., b1n1], [b21, ..., b2n2], ...], where each list of
            blocks [bi1, ..., bini] corresponds to a possible meaning of the
            input string.

        Note:
            In this implementation, only one meaning is available.
        """
        ui.render_debug('compute_blocks(...) called for word ' + self.string)

        stem = self.string_without_suffix

        if compute_etymology:
            etymology = self.db_util.get_hanja(stem)
            if etymology:
                ui.render_debug('Found hanja={}'.format(etymology))

                # The hanja is indexed with the position in the stem (spaces
                # included), so that characters stay aligned with their hanja.
                blocks = [
                    Block(char,
                          etymology=etymology[i],
                          meaning=self.db_util.get_hanja_meaning(etymology[i]),
                          name=self.db_util.get_hanja_name(etymology[i]))
                    for i, char in enumerate(stem)
                    if char != ' '
                ]
            else:
                ui.render_error(
                    'Hanja not found for {}.'
                    'Please check the spelling or populate the `Korean` table '
                    'with more data.'.format(stem))
                blocks = []
        else:
            blocks = [Block(char) for char in stem if char != ' ']

        if self.suffix:
            suffix_desc = 'Suffix: ' + self.suffix_meaning
            blocks.append(Block(self.suffix, meaning=suffix_desc))

        return [blocks]