from textblob import TextBlob

def get_words(tweet):
    # Build a list of all the words in a tweet, singularized and lemmatized.
    tweet_blob = TextBlob(tweet)
    tweet_blob = tweet_blob.words
    tweet_blob = tweet_blob.singularize()
    tweet_blob = tweet_blob.lemmatize()
    # Return the words of the tweet with duplicates removed, preserving order.
    L = []
    for word in tweet_blob:
        # Make sure each word appears only once in the list.
        if word not in L:
            L.append(word)
    return L
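# Minimal usage sketch for get_words (assumes the TextBlob corpora have been
# installed via `python -m textblob.download_corpora`); the tweet is invented.
words = get_words("Cats are chasing the mice in the garden")
print(words)  # a de-duplicated list of singularized, lemmatized words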
import sys

from nltk.tokenize import sent_tokenize
from textblob import TextBlob
from textblob.np_extractors import ConllExtractor
# OpenNLP is assumed to be a project-local wrapper around the Apache OpenNLP
# command-line tools; it is not part of TextBlob or NLTK.

def parseContents(contentList):
    tupleList = []
    posTagger = OpenNLP("/home/rohith/nitk/apache-opennlp-1.6.0", "POSTagger", "en-pos-maxent.bin")
    chunker = OpenNLP("/home/rohith/nitk/apache-opennlp-1.6.0", "ChunkerME", "en-chunker.bin")
    for item in contentList:
        attr = item[0]
        content = item[1]
        content = content.replace('\n', '')
        sentences = sent_tokenize(content)
        for sentence in sentences:
            print('#' + sentence, file=sys.stderr)
            # Extract noun phrases with TextBlob's ConllExtractor, then
            # yield them lemmatized alongside the attribute name.
            extractor = ConllExtractor()
            np = TextBlob(sentence, np_extractor=extractor).noun_phrases
            yield attr, np.lemmatize()
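# Hypothetical driver for the parseContents generator; contentList pairs an
# attribute name with a block of text (both values below are invented).
contentList = [("summary", "Apache OpenNLP ships pretrained models. TextBlob extracts noun phrases.")]
for attr, phrases in parseContents(contentList):
    print(attr, list(phrases))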
import json
import shelve

import requests
from textblob import TextBlob, Word

def createdb(self):
    filepath = '/home/an/Desktop/file.log'
    with open(filepath) as fp:
        line = fp.readline()
        strlist = []
        str1 = ''
        while line:
            count = len(line.strip())
            print(count)
            if count == 1:
                # Single-character lines are keystrokes; accumulate them into a word.
                str1 += line.strip()
            else:
                # A blank or longer line ends the word: spell-correct it,
                # lemmatize it, lower-case it, and store it.
                if len(str1) > 1 and str1.isalpha():
                    str1 = str(TextBlob(str1).correct())
                    str1 = Word(str1).lemmatize()
                    strlist.append(str(str1).lower())
                str1 = ''
            # Read the next line at the end of the loop so that the first
            # line of the file is processed as well.
            line = fp.readline()
    # Truncate the log now that its contents have been consumed.
    open('/home/an/Desktop/file.log', 'w').close()
    dbfile = shelve.open("dbfile")
    global gb  # gb (the current username) is defined elsewhere in this module
    if gb in list(dbfile.keys()):
        dbfile[gb] += strlist
    else:
        dbfile[gb] = strlist
    try:
        list1 = dbfile[gb]
        payload = {"username": gb, "tokens": list1}
        r1 = requests.post('http://127.0.0.1:5000/tokenposter', data=json.dumps(payload))
        print(r1.text)
        # Clear the local buffer once the server acknowledges receipt.
        if r1.text == 'received':
            dbfile[gb] = []
    except Exception as e:
        print(e)
    dbfile.close()
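# Hypothetical smoke test for createdb: file.log is assumed to hold one
# keystroke per line, with a blank (or longer) line terminating each word;
# `gb` and the /tokenposter endpoint are assumed to exist in the real project.
gb = "testuser"
with open('/home/an/Desktop/file.log', 'w') as fp:
    fp.write("h\ni\n\n")
createdb(None)  # `self` is never used, so a placeholder value is fine here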
from textblob import TextBlob, Word

def Tokenization_Stemmer(str1):
    zen = TextBlob(str1)
    zen = zen.words        # tokenize
    zen = zen.lemmatize()  # reduce plural nouns to their singular base form
    zen = list(zen)
    # Reduce verb participles and gerunds to their base form.
    for i in range(len(zen)):
        w = Word(zen[i])
        zen[i] = w.lemmatize("v")
    # Convert every word to lower case.
    for i in range(len(zen)):
        zen[i] = zen[i].lower()
    zen = sorted(zen)
    return zen
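# Minimal usage sketch for Tokenization_Stemmer (assumes the TextBlob corpora
# are installed); the input sentence is invented.
print(Tokenization_Stemmer("The children were eating apples"))
# expected: a sorted list of lower-cased base forms,
# e.g. ['apple', 'be', 'child', 'eat', 'the'] (exact output may vary)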