Example #1
from nltk.corpus import stopwords

def remove_stopwords(words):
    """Remove stop words from a list of tokenized words."""
    stop_words = set(stopwords.words('english'))  # build the set once, not once per word
    return [word for word in words if word not in stop_words]
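A quick usage sketch, assuming the stop-word corpus is available (via nltk.download('stopwords')); the token list here is made up:

tokens = ['this', 'is', 'a', 'simple', 'sentence']
print(remove_stopwords(tokens))  # ['simple', 'sentence']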
Example #2
import re
from nltk.corpus import stopwords

def remove_punc_stopwords_lower(s):
    """
    INPUT: string
    OUTPUT: string

    Lower-cases the string, splits it on non-word characters (dropping
    punctuation), and removes English stop words.
    """
    stop = set(stopwords.words('english'))  # set lookup is O(1) per token
    regex = r"\W+"
    # re.split can yield empty strings at the edges, hence the `if i` guard
    return " ".join(i for i in re.split(regex, s.lower()) if i and i not in stop)
Example #3
import string
from nltk.corpus import stopwords

def generate_unigrams(text):
    """Strip punctuation from the text, then return its non-stop-word tokens."""
    punctuation_chars = set(string.punctuation)
    stop_words = set(stopwords.words('english'))

    # Drop punctuation characters, then split the remainder on whitespace.
    punctuation_removed = ''.join(
        char for char in text if char not in punctuation_chars
    )
    return [
        word for word in punctuation_removed.split()
        if word.lower() not in stop_words
    ]
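For illustration, a usage sketch with a made-up sentence; note that the original casing of surviving tokens is preserved, since lower() is only applied for the stop-word check:

sentence = "Hello, world: stop words are removed here."
print(generate_unigrams(sentence))  # ['Hello', 'world', 'stop', 'words', 'removed']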
Example #4
# Constructor fragment from a text-processing class; it needs:
# from nltk.corpus import stopwords
# from nltk.tokenize import word_tokenize
def __init__(self, data):
    self.stop = stopwords.words("english")
    self.data = [word_tokenize(doc) for doc in data]
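Since the snippet is only a constructor, here is a minimal sketch of a surrounding class it could belong to; the class name TokenizedCorpus is an assumption, and running it requires nltk.download('punkt') and nltk.download('stopwords'):

from nltk.corpus import stopwords
from nltk.tokenize import word_tokenize

class TokenizedCorpus:  # hypothetical name; the source shows only __init__
    def __init__(self, data):
        self.stop = stopwords.words("english")
        self.data = [word_tokenize(doc) for doc in data]

docs = TokenizedCorpus(["This is a test.", "Stop words get stored separately."])
print(docs.data[0])  # ['This', 'is', 'a', 'test', '.']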
Example #5
from nltk.corpus import stopwords

# word_list is assumed to be an already-tokenized list of words
stop_words = set(stopwords.words('english'))
filtered_words = [word for word in word_list if word not in stop_words]

def comp(list1, list2):
    """Return the fraction of items in list1 that also appear in list2,
    together with the items that were not found."""
    match_count = 0
    nomatches = []
    for i in list1:
        if i in list2:
            match_count += 1
        else:
            nomatches.append(i)
    return match_count / len(list1), nomatches
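A small, made-up usage sketch for comp:

ratio, missing = comp(['a', 'b', 'c', 'd'], ['b', 'd'])
print(ratio)    # 0.5
print(missing)  # ['a', 'c']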