def supported_languages():
    """Return capitalized names of the languages NLTK ships stopwords for.

    Returns an empty list when the NLTK data is not downloaded.
    """
    # get NLTK list of stopwords; corpus files are lowercase language names
    # (e.g. 'english'), which distinguishes them from README-style entries.
    stopwords_listdir = []
    try:
        stopwords_listdir = [file for file in os.listdir(stopwords._get_root())
                             if file.islower()]
    except LookupError:  # when no NLTK data is available
        pass
    return [file.capitalize() for file in stopwords_listdir]
def supported_languages():
    """List the languages for which an NLTK stopword corpus is installed."""
    try:
        root = stopwords._get_root()
        # Stopword corpora are stored as all-lowercase file names.
        languages = [name for name in os.listdir(root) if name.islower()]
    except LookupError:
        # No NLTK data has been downloaded yet -- report nothing.
        languages = []
    return [name.capitalize() for name in languages]
def supported_languages():
    """Return supported language names: Chinese plus NLTK stopword languages.

    NLTK-provided languages are sorted and capitalized; Chinese ('中文') is
    supported separately from NLTK, so it is prepended manually.
    Returns only Chinese when the NLTK data is not downloaded.
    """
    # get NLTK list of stopwords; corpus files are lowercase language names
    stopwords_listdir = []
    try:
        stopwords_listdir = [
            file for file in os.listdir(stopwords._get_root())
            if file.islower()
        ]
    except LookupError:  # when no NLTK data is available
        pass
    return ['中文'] + sorted(
        file.capitalize() for file in stopwords_listdir
    )
def from_file(self, path):
    """Load a newline-separated word list from *path*.

    An empty/None path clears the list; otherwise the file's encoding is
    detected and each stripped line becomes a word-list entry.
    """
    self.file_path = path
    if not path:
        self.word_list = []
    else:
        enc = detect_encoding(path)
        with open(path, encoding=enc) as f:
            # set comprehension: deduplicates without an intermediate list
            self.word_list = {line.strip() for line in f}


# get NLTK list of stopwords; corpus files are lowercase language names
stopwords_listdir = []
try:
    stopwords_listdir = [
        file for file in os.listdir(stopwords._get_root())
        if file.islower()
    ]
except LookupError:  # when no NLTK data is available
    pass


class StopwordsFilter(BaseTokenFilter, WordListMixin):
    """ Remove tokens present in NLTK's language specific lists or a file. """
    name = 'Stopwords'

    # Derived at import time from the installed NLTK stopword corpora.
    supported_languages = [file.capitalize() for file in stopwords_listdir]

    @wait_nltk_data
    def __init__(self, language='English', word_list=None):
        WordListMixin.__init__(self, word_list)
        super().__init__()
# NOTE(review): these two statements are the tail of a method whose `def`
# line lies outside this chunk -- kept verbatim, in order.
self.file_path = None
self.word_list = word_list or []


def from_file(self, path):
    """Load a newline-separated word list from *path*.

    An empty/None path clears the list; otherwise the file's encoding is
    detected and each stripped line becomes a word-list entry.
    """
    self.file_path = path
    if not path:
        self.word_list = []
    else:
        enc = detect_encoding(path)
        with open(path, encoding=enc) as f:
            # set comprehension: deduplicates without an intermediate list
            self.word_list = {line.strip() for line in f}


# get NLTK list of stopwords; corpus files are lowercase language names
stopwords_listdir = []
try:
    stopwords_listdir = [file for file in os.listdir(stopwords._get_root())
                         if file.islower()]
except LookupError:  # when no NLTK data is available
    pass


class StopwordsFilter(BaseTokenFilter, WordListMixin):
    """ Remove tokens present in NLTK's language specific lists or a file. """
    name = 'Stopwords'

    # Derived at import time from the installed NLTK stopword corpora.
    supported_languages = [file.capitalize() for file in stopwords_listdir]

    def __init__(self, language='English', word_list=None):
        WordListMixin.__init__(self, word_list)
        super().__init__()
        self.language = language