Python Frequencyの例

プログラミング言語: Python

名前空間/パッケージ名: counting

クラス/型: Frequency

hotexamples.comのコード掲載数: 4

Python Frequency - 4件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのcounting.Frequencyの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示 / 非表示

Frequency(1)

increment(1)

コード例 #1

ファイルを表示

class NGramCounter(object):
    """
    Count n-grams drawn from a corpus.

    The corpus is an iterable of reader objects, each exposing a
    ``words()`` method. Iterating over the counter yields the n-grams;
    ``count()`` feeds them into the internal ``Frequency`` instance.
    """
    def __init__(self, corpus, N=1):
        """
        Store the corpus and the n-gram size ``N`` and create an empty
        ``Frequency`` to hold the counts.
        """
        self.corpus, self.N = corpus, N
        self.frequency = Frequency()

    def words(self):
        """
        Yield every word of every reader in the corpus, stripped of
        surrounding whitespace and lowercased. Words that are empty
        after stripping are dropped.
        """
        for reader in self.corpus:
            for raw in reader.words():
                stripped = raw.strip()
                if not stripped:
                    continue
                yield stripped.lower()

    def __iter__(self):
        """
        Yield the n-grams to be counted: plain words when ``N`` is 1,
        otherwise tuples of ``N`` consecutive words taken from a window
        that slides over the word stream one word at a time.
        """
        if self.N != 1:
            window = []
            for token in self.words():
                if len(window) < self.N:
                    window.append(token)
                if len(window) != self.N:
                    # Window not full yet; keep collecting words.
                    continue
                yield tuple(window)
                # Drop the oldest word so the next one completes a new n-gram.
                window = window[1:]
            return

        # Unigrams are yielded as bare strings, not 1-tuples.
        for token in self.words():
            yield token

    def count(self):
        """
        Return the frequency object, populating it from the corpus first
        if it is still falsy (i.e. nothing has been counted yet).
        """
        if self.frequency:
            return self.frequency
        for ngram in self:
            self.frequency.increment(ngram)
        return self.frequency

コード例 #2

ファイルを表示

ファイル: ngram.py プロジェクト: bbengfort/ngram-light

class NGramCounter(object):
    """
    Walks a corpus of readers and tallies the n-grams it contains in an
    internal ``Frequency`` object.
    """

    def __init__(self, corpus, N=1):
        """
        Remember the corpus and the n-gram length ``N``; start with a
        fresh ``Frequency`` for the counts.
        """
        self.N = N
        self.corpus = corpus
        self.frequency = Frequency()

    def words(self):
        """
        Generator over all words from every reader in the corpus. Each
        word is whitespace-stripped and lowercased; blank words are
        skipped.
        """
        for reader in self.corpus:
            for item in reader.words():
                cleaned = item.strip()
                if cleaned:
                    yield cleaned.lower()

    def __iter__(self):
        """
        Generator over the n-grams to record. For ``N == 1`` each word is
        yielded as-is; otherwise each run of ``N`` consecutive words is
        yielded as a tuple.
        """
        if self.N == 1:
            # Unigram case: hand back the words themselves.
            for unigram in self.words():
                yield unigram
            return

        buffered = []
        for term in self.words():
            if len(buffered) < self.N:
                buffered.append(term)
            if len(buffered) == self.N:
                yield tuple(buffered)
                # Slide forward by discarding the leading word.
                buffered = buffered[1:]

    def count(self):
        """
        Populate the frequency from the corpus when it is still falsy,
        then return it. A frequency that is already truthy is returned
        untouched.
        """
        needs_counting = not self.frequency
        if needs_counting:
            for ngram in self:
                self.frequency.increment(ngram)
        return self.frequency

コード例 #3

ファイルを表示

 def __init__(self, corpus, N=1):
     """
     Keep a reference to the corpus and the n-gram size ``N`` and
     create a new ``Frequency`` instance for the counts.
     """
     self.corpus, self.N = corpus, N
     self.frequency = Frequency()

コード例 #4

ファイルを表示

ファイル: ngram.py プロジェクト: bbengfort/ngram-light

 def __init__(self, corpus, N=1):
     """
     Initialise the instance with its corpus, the n-gram size ``N``
     and a newly constructed ``Frequency`` object.
     """
     self.N = N
     self.corpus = corpus
     self.frequency = Frequency()