예제 #1
0
    def supported_languages():
        """Return the capitalized names of languages for which NLTK
        provides a stopword list.

        Returns an empty list when no NLTK data has been downloaded.
        """
        stopwords_listdir = []
        try:
            # NLTK stores one lowercase-named file per language.
            stopwords_listdir = [file for file in
                                 os.listdir(stopwords._get_root())
                                 if file.islower()]
        except LookupError:  # when no NLTK data is available
            pass

        return [file.capitalize() for file in stopwords_listdir]
예제 #2
0
    def supported_languages():
        """List the languages for which NLTK ships a stopword file.

        Yields an empty result when the NLTK corpus data is missing.
        """
        languages = []
        try:
            root = stopwords._get_root()
            languages = [entry for entry in os.listdir(root)
                         if entry.islower()]
        except LookupError:  # when no NLTK data is available
            pass

        return [entry.capitalize() for entry in languages]
예제 #3
0
    def supported_languages():
        """Return '中文' followed by the sorted, capitalized names of
        NLTK's stopword languages (empty apart from '中文' when no
        NLTK data is available).
        """
        found = []
        try:
            found = [name for name in os.listdir(stopwords._get_root())
                     if name.islower()]
        except LookupError:  # when no NLTK data is available
            pass

        return ['中文'] + sorted(name.capitalize() for name in found)
예제 #4
0
    def from_file(self, path):
        """Load the word list from *path*; a falsy path clears the list."""
        self.file_path = path
        if not path:
            self.word_list = []
            return
        encoding = detect_encoding(path)
        with open(path, encoding=encoding) as handle:
            # One word per line; strip surrounding whitespace/newlines.
            self.word_list = {line.strip() for line in handle}


# Discover NLTK's per-language stopword files at import time; NLTK names
# each file after its language in lowercase.
stopwords_listdir = []
try:
    corpus_root = stopwords._get_root()
    stopwords_listdir = [entry for entry in os.listdir(corpus_root)
                         if entry.islower()]
except LookupError:  # when no NLTK data is available
    pass


class StopwordsFilter(BaseTokenFilter, WordListMixin):
    """ Remove tokens present in NLTK's language specific lists or a file. """
    # Display name of this filter.
    name = 'Stopwords'

    # Capitalized language names derived from the NLTK stopword files
    # discovered at import time (empty when no NLTK data is available).
    supported_languages = [file.capitalize() for file in stopwords_listdir]

    # NOTE(review): decorator presumably defers until NLTK data is
    # downloaded — confirm against wait_nltk_data's definition.
    @wait_nltk_data
    def __init__(self, language='English', word_list=None):
        # Initialize the word-list mixin before the base filter.
        WordListMixin.__init__(self, word_list)
        super().__init__()
예제 #5
0
        self.file_path = None
        self.word_list = word_list or []

    def from_file(self, path):
        """Replace the word list with the contents of *path*.

        A falsy *path* resets the list to empty.
        """
        self.file_path = path
        if path:
            with open(path, encoding=detect_encoding(path)) as src:
                # Each line holds one word; drop surrounding whitespace.
                self.word_list = set(line.strip() for line in src)
        else:
            self.word_list = []

# Collect the lowercase-named stopword files NLTK ships, one per language.
stopwords_listdir = []
try:
    root = stopwords._get_root()
    stopwords_listdir = [name for name in os.listdir(root) if name.islower()]
except LookupError:     # when no NLTK data is available
    pass


class StopwordsFilter(BaseTokenFilter, WordListMixin):
    """ Remove tokens present in NLTK's language specific lists or a file. """
    # Display name of this filter.
    name = 'Stopwords'

    # Capitalized language names built from the NLTK stopword files found
    # at import time (empty when no NLTK data is available).
    supported_languages = [file.capitalize() for file in stopwords_listdir]

    def __init__(self, language='English', word_list=None):
        """Create the filter for *language*, optionally seeded with a
        user-supplied *word_list*.
        """
        # Initialize the word-list mixin before the base filter.
        WordListMixin.__init__(self, word_list)
        super().__init__()
        self.language = language