Python preprocess_tweet Examples

Programming Language: Python

Namespace/Package Name: pysentimiento.preprocessing

Method/Function: preprocess_tweet

Examples at hotexamples.com: 12

Python preprocess_tweet - 12 examples found. These are the top-rated real-world Python examples of pysentimiento.preprocessing.preprocess_tweet, extracted from open-source projects. You can rate the examples to help us improve their quality.

Example #1

Show file

def test_preprocessing_handles_hashtags():
    """
    A CamelCase hashtag is rewritten as plain lowercase words.

    The input ends in ``#UnaGenialidad``; the expected output ends in
    ``una genialidad`` (no ``#``, words separated by a space).
    """
    expected = "esto es una genialidad"
    processed = preprocess_tweet("esto es #UnaGenialidad")

    assert processed == expected

Example #2

Show file

def test_preprocessing_replaces_users():
    """
    A leading ``@handle`` is swapped for the ``[USER]`` placeholder token,
    leaving the rest of the tweet untouched.
    """
    tweet = "@perezjotaeme debería cambiar esto"
    expected = "[USER] debería cambiar esto"

    processed = preprocess_tweet(tweet)

    assert processed == expected

Example #3

Show file

def test_shortens_laughters():
    """
    With ``lang="en"``, irregular English laughter ("hahahhahaha",
    "ahahahahahah") is normalised to "haha".
    """
    tweet = "hahahhahaha can't believe it ahahahahahah"
    expected = "haha can't believe it haha"

    processed = preprocess_tweet(tweet, lang="en")

    assert processed == expected

Example #4

Show file

def test_shortens_laughters():
    """
    With the default language, irregular "jaja"-style laughter is normalised
    to "jaja".
    """
    tweet = "jajajajaajjajaajajaja no lo puedo creer ajajaj"
    expected = "jaja no lo puedo creer jaja"

    processed = preprocess_tweet(tweet)

    assert processed == expected

Example #5

Show file

def test_shortens_repeated_characters():
    """
    With ``shorten=2``, elongated runs of the same character are cut down to
    two occurrences ("naaaaaaaadaaaaaaaa" becomes "naadaa").
    """
    tweet = "no entiendo naaaaaaaadaaaaaaaa"
    expected = "no entiendo naadaa"

    processed = preprocess_tweet(tweet, shorten=2)

    assert processed == expected

Example #6

Show file

def test_preprocessing_replaces_urls():
    """
    A URL in the tweet is swapped for the ``[URL]`` placeholder token.
    """
    tweet = "esto es muy bueno http://bit.ly/sarasa"
    expected = "esto es muy bueno [URL]"

    processed = preprocess_tweet(tweet)

    assert processed == expected

Example #7

Show file

File: preprocess_tweet_file.py Project: finiteautomata/pysentimiento

def my_preprocess(*args):
    """
    Call ``preprocess_tweet`` with a fixed set of token overrides.

    All positional arguments are forwarded unchanged; the user, URL and
    hashtag tokens and the emoji wrapper are always set to the values below.
    """
    return preprocess_tweet(
        *args,
        user_token="USUARIO",
        url_token="URL",
        hashtag_token="hashtag",
        emoji_wrapper="",
    )

Example #8

Show file

def preprocess(tweet):
    """
    Preprocess a tweet and flatten it onto a single, tidy line.

    The tweet goes through ``preprocess_tweet`` using the externally defined
    ``preprocess_args``. Each run of newlines is then turned into a period
    followed by a space, every whitespace run is collapsed to one space, and
    leading/trailing whitespace is stripped.
    """
    processed = preprocess_tweet(tweet, **preprocess_args)
    # Newlines must be handled before the generic whitespace collapse,
    # otherwise they would be reduced to plain spaces.
    single_line = re.sub("\n+", ". ", processed)
    collapsed = re.sub(r"\s+", " ", single_line)
    return collapsed.strip()

Example #9

Show file

def test_replaces_emoji_in_english():
    """
    With ``lang="en"``, an emoji is replaced by an English description
    wrapped in ``[EMOJI]`` markers, with a space on each side.
    """
    emoji = "🤣"
    expected = ' [EMOJI] rolling on the floor laughing [EMOJI] '

    processed = preprocess_tweet(emoji, lang="en")

    assert processed == expected

Example #10

Show file

def test_replaces_emoji():
    """
    With the default language, an emoji is replaced by a Spanish description
    wrapped in ``[EMOJI]`` markers, with a space on each side.
    """
    emoji = "🤣"
    expected = ' [EMOJI] cara revolviéndose de la risa [EMOJI] '

    processed = preprocess_tweet(emoji)

    assert processed == expected

Example #11

Show file

def test_replaces_odd_quotation_marks():
    """
    Curly quotation marks (“ and ”) are normalised to the plain ASCII
    double-quote character.
    """
    tweet = "Pero pará un poco, “loquita”"
    expected = 'Pero pará un poco, "loquita"'

    processed = preprocess_tweet(tweet)

    assert processed == expected

Example #12

Show file

File: async_generate_txts.py Project: finiteautomata/spritzer-tweets

def my_preprocess(tweet):
    """
    Preprocess a tweet and squeeze it onto one line.

    Runs ``preprocess_tweet`` with the externally defined ``preprocess_args``,
    then applies two substitutions in order: newline runs become a period
    plus a space, and whitespace runs become a single space. The result is
    returned with surrounding whitespace stripped.
    """
    # Order matters: newlines are rewritten before whitespace is collapsed.
    substitutions = (
        ("\n+", ". "),
        (r"\s+", " "),
    )

    text = preprocess_tweet(tweet, **preprocess_args)
    for pattern, replacement in substitutions:
        text = re.sub(pattern, replacement, text)
    return text.strip()