from collections import OrderedDict

from nltk import FreqDist
from nltk.util import bigrams


def build(master_dict, path, l, fh):
    # Initialise every master bigram with a zero count, preserving order.
    m_dict = OrderedDict((item, 0) for item in sorted(master_dict))

    # Count the bigrams that actually occur in the file at `path`.
    with open(path, "r") as fhl:
        temp = FreqDist(bigrams(fhl.read().split()))

    # FreqDist behaves like a Counter: missing keys count as 0.
    for key in m_dict:
        m_dict[key] = temp[key]

    # Write one CSV row: the label `l` followed by the ordered counts.
    values = [str(val) for val in m_dict.values()]
    fh.write(l + "," + ",".join(values))
    fh.write('\n')
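A minimal driver sketch for build(), assuming the caller first pools the bigrams of every input file into master_dict and opens one output CSV handle; the file paths and labels below are hypothetical.

files = [("pos", "reviews/pos01.txt"), ("neg", "reviews/neg01.txt")]

# Pool the bigram vocabulary of all files (hypothetical paths above).
master_dict = set()
for _, path in files:
    with open(path) as f:
        master_dict.update(bigrams(f.read().split()))

# One CSV row per file: label first, then counts in sorted-bigram order.
with open("features.csv", "w") as out:
    for label, path in files:
        build(master_dict, path, label, out)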
Example #2
from nltk import FreqDist


class termBased(AbstractGenerativeModel):
    """Unigram language model.

    The caller must pass an analyser that breaks a document into
    tokens; the analyser may also remove stopwords and normalise
    words. AbstractGenerativeModel is defined elsewhere in the
    project.
    """

    def __init__(self, analyser):
        self.analyser = analyser
        print("Term Based")

    def generateProbabilityDistribution(self, document_list):
        # Pool the tokens of all documents into one frequency distribution.
        tokens = []
        for doc in document_list:
            tokens += self.analyser(doc)
        self.freqDist = FreqDist(tokens)

    def getProbabilityDistribution(self):
        return self.freqDist

    def probOfDocument(self, document):
        # Multiply the relative frequencies of the tokens seen in
        # training; tokens outside the distribution are skipped.
        tokens = self.analyser(document)
        prob = 1.0
        for token in tokens:
            if token in self.freqDist:
                prob *= self.freqDist.freq(token)
        if prob == 1.0:  # no token matched the training distribution
            return 0.0
        return prob
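A short usage sketch for termBased, assuming AbstractGenerativeModel is importable from the project; the whitespace analyser here is a hypothetical stand-in for the project's real tokeniser.

# Hypothetical analyser: lowercase, then split on whitespace.
def analyser(document):
    return document.lower().split()

model = termBased(analyser)
model.generateProbabilityDistribution([
    "the cat sat on the mat",
    "the dog sat on the log",
])
# Product of relative frequencies of the tokens seen in training.
print(model.probOfDocument("the cat sat"))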
Example #3
import nltk

def featureList(corpus):
    # noFeat and trainKeys are module-level globals defined by the
    # surrounding project: the feature count and the ordered feature keys.
    featList = []
    for post in corpus:
        # Word frequencies for this post.
        fileFreqDist = nltk.FreqDist(nltk.word_tokenize(post))

        # One count per training key; keys absent from the post stay 0.
        listItem = [0] * noFeat
        for i, key in enumerate(trainKeys):
            if key in fileFreqDist:
                listItem[i] = fileFreqDist[key]

        featList.append(listItem)

    return featList
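featureList reads noFeat and trainKeys from the enclosing module, so the caller must bind them first. One plausible setup, with illustrative training posts, takes the most frequent tokens of the training data as the feature keys:

# Illustrative setup for the globals featureList expects.
train_posts = ["the cat sat on the mat", "the dog barked at the cat"]

trainDist = nltk.FreqDist(
    token for post in train_posts for token in nltk.word_tokenize(post)
)
trainKeys = [word for word, _ in trainDist.most_common(50)]
noFeat = len(trainKeys)

features = featureList(train_posts)  # one count vector per post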
Example #4
    def featureList(corpus):
        # As above, but defined at class scope in its source project;
        # noFeat and trainKeys are again globals from that project.
        featList = []
        for post in corpus:
            fileFreqDist = nltk.FreqDist(nltk.word_tokenize(post))

            listItem = [0] * noFeat
            for i, key in enumerate(trainKeys):
                if key in fileFreqDist:
                    listItem[i] = fileFreqDist[key]

            featList.append(listItem)

        return featList
Example #5
def featureList(corpus):
    # Variant for an NLTK corpus reader: one count vector per file.
    # noFeat and trainKeys are globals from the surrounding project.
    featList = []
    for trFile in corpus.fileids():
        fileFreqDist = nltk.FreqDist(corpus.words(trFile))

        listItem = [0] * noFeat
        for i, key in enumerate(trainKeys):
            if key in fileFreqDist:
                listItem[i] = fileFreqDist[key]

        featList.append(listItem)

    return featList
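For this corpus-reader variant, a sketch using NLTK's PlaintextCorpusReader over a hypothetical directory of .txt files:

from nltk.corpus import PlaintextCorpusReader

corpus = PlaintextCorpusReader("data/train", r".*\.txt")  # hypothetical path

trainDist = nltk.FreqDist(corpus.words())
trainKeys = [word for word, _ in trainDist.most_common(50)]
noFeat = len(trainKeys)

features = featureList(corpus)  # one count vector per file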
Example #6
def createFeatures(sentVect, ordList):
    # Like featureList, but the feature ordering is passed in
    # explicitly instead of being read from globals.
    noFeat = len(ordList)

    featList = []
    for post in sentVect:
        fileFreqDist = nltk.FreqDist(nltk.word_tokenize(post))

        listItem = [0] * noFeat
        for i, key in enumerate(ordList):
            if key in fileFreqDist:
                listItem[i] = fileFreqDist[key]

        featList.append(listItem)

    return featList
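Because createFeatures takes its feature ordering as an argument, it needs no globals; a minimal call with illustrative data:

sentVect = ["I loved this movie", "I hated this movie"]
ordList = ["loved", "hated", "movie"]

# Rows align with sentVect, columns with ordList:
# [[1, 0, 1], [0, 1, 1]]
print(createFeatures(sentVect, ordList))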
Example #7
def createFeatures(sentVect, ordList):
    # Same bag-of-words featurisation as Example #6.
    noFeat = len(ordList)

    featList = []
    for post in sentVect:
        fileFreqDist = nltk.FreqDist(nltk.word_tokenize(post))

        listItem = [0] * noFeat
        for i, key in enumerate(ordList):
            if key in fileFreqDist:
                listItem[i] = fileFreqDist[key]

        featList.append(listItem)

    return featList