def reducefn(author, titles):
    from stopwords import allStopWords
    from utils import normalize_words
    terms_freq = {}
    for title in titles:
        ### Normalize the words (lower-case, strip punctuation and hyphens),
        ### drop stopwords and single-letter words, and accumulate the cumulative frequency.
        title_terms = normalize_words(title)
        for term in title_terms.split():
            ## allStopWords comes from the stopwords module;
            ## single-letter words are skipped as well.
            if term not in allStopWords and len(term) > 1:
                terms_freq[term] = terms_freq.get(term, 0) + 1
    ## Reduce result: term frequencies over all of this author's titles.
    return terms_freq
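## For reference, the counting above is equivalent to the following
## collections.Counter sketch (not used by the job itself, shown only to
## illustrate the cumulative-frequency step):
##
##     from collections import Counter
##     counts = Counter()
##     for title in titles:
##         counts.update(t for t in normalize_words(title).split()
##                       if t not in allStopWords and len(t) > 1)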
def mapfn(filenumber, filecontent):
    from utils import normalize_words
    ## Emit the concatenated titles of every author found in the file.
    author_contents = {}
    for line in filecontent.splitlines():
        ## Each line has the form: conf:::author_1::author_2:::title
        docdata = line.split(':::')
        authors_list = docdata[1].split('::')
        title = docdata[-1]
        for author in authors_list:
            author = normalize_words(author)
            if author in author_contents:
                author_contents[author] = author_contents[author] + " " + title
            else:
                author_contents[author] = title
    ## Map results: one (author, titles) pair per author.
    for author in author_contents:
        yield author, author_contents[author]
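## Minimal local driver: a sketch that chains mapfn and reducefn in-process so
## the pipeline can be sanity-checked without any MapReduce framework. The
## sample line below is hypothetical and only mirrors the expected
## conf:::author_1::author_2:::title format.
if __name__ == '__main__':
    sample = "SIGMOD:::Jane Doe::John Smith:::Scalable Graph Processing"
    ## Map phase: group every value emitted by mapfn under its key (the author).
    grouped = {}
    for author, titles in mapfn(0, sample):
        grouped.setdefault(author, []).append(titles)
    ## Reduce phase: per-author term frequencies over the grouped titles.
    results = dict((author, reducefn(author, titles))
                   for author, titles in grouped.items())
    print(results)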