Exemplo n.º 1
0
    def is_tweet_valid(self, tweet):
        """Decide whether ``tweet`` should be kept for further processing.

        ``tweet`` is presumably a dict-like decoded Twitter status (TODO
        confirm against the caller); only membership tests and the ``"lang"``
        and ``"text"`` items are used here.

        The tweet is rejected (``False``) when any of the following holds:

        * it is falsy or contains a ``"delete"`` entry;
        * it has no ``"lang"`` entry, or that entry is not ``"en"``;
        * it has no ``"text"`` entry, or the text starts with ``"RT"``;
        * the whitespace-split result of ``TwitterMixin.word_map`` on the
          text contains both the ``"__h__"`` and ``"__s__"`` tokens.

        Otherwise ``True`` is returned. Each rejection is logged at debug
        level.
        """
        # Falsy payloads and payloads carrying a "delete" entry are dropped.
        if not tweet or "delete" in tweet:
            logger.debug("Empty tweet - skipping")
            return False

        if "lang" not in tweet or tweet["lang"] != "en":
            logger.debug("Non EN - skipping")
            return False

        # Any text beginning with "RT" is treated as a retweet.
        if "text" not in tweet or tweet["text"].startswith("RT"):
            logger.debug("RE-Tweet found - skipping")
            return False

        # Compare whole tokens, not substrings, hence the split().
        folded_tokens = TwitterMixin.word_map(tweet["text"]).split()
        # Both markers present at once (presumably opposite emoticon
        # classes -- verify against word_map) makes the tweet unusable.
        if "__h__" in folded_tokens and "__s__" in folded_tokens:
            logger.debug("Tweet with double emoicons found - skipping")
            return False

        return True
Exemplo n.º 2
0
    def is_tweet_valid(self, tweet):
        """Decide whether ``tweet`` should be kept for further processing.

        ``tweet`` is presumably a dict-like decoded Twitter status (TODO
        confirm against the caller); only membership tests and the ``'lang'``
        and ``'text'`` items are used here.

        The tweet is rejected (``False``) when any of the following holds:

        * it is falsy or contains a ``'delete'`` entry;
        * it has no ``'lang'`` entry, or that entry is not ``'en'``;
        * it has no ``'text'`` entry, or the text starts with ``'RT'``;
        * the whitespace-split result of ``TwitterMixin.word_map`` on the
          text contains both the ``'__h__'`` and ``'__s__'`` tokens.

        Otherwise ``True`` is returned. Each rejection is logged at debug
        level.
        """
        # Falsy payloads and payloads carrying a 'delete' entry are dropped.
        if not tweet or 'delete' in tweet:
            logger.debug('Empty tweet - skipping')
            return False

        if 'lang' not in tweet or tweet['lang'] != 'en':
            logger.debug('Non EN - skipping')
            return False

        # Any text beginning with 'RT' is treated as a retweet.
        if 'text' not in tweet or tweet['text'].startswith('RT'):
            logger.debug('RE-Tweet found - skipping')
            return False

        # Compare whole tokens, not substrings, hence the split().
        folded_tokens = TwitterMixin.word_map(tweet['text']).split()
        # Both markers present at once (presumably opposite emoticon
        # classes -- verify against word_map) makes the tweet unusable.
        if '__h__' in folded_tokens and '__s__' in folded_tokens:
            logger.debug('Tweet with double emoicons found - skipping')
            return False

        return True
Exemplo n.º 3
0
    def is_tweet_valid(self, tweet):
        """Decide whether ``tweet`` should be kept for further processing.

        ``tweet`` is presumably a dict-like decoded Twitter status (TODO
        confirm against the caller); only membership tests and the ``'lang'``
        and ``'text'`` items are used here.

        The tweet is rejected (``False``) when any of the following holds:

        * it is falsy or contains a ``'delete'`` entry;
        * it has no ``'lang'`` entry, or that entry is not ``'en'``;
        * it has no ``'text'`` entry, or the text starts with ``'RT'``;
        * the whitespace-split result of ``TwitterMixin.word_map`` on the
          text contains both the ``'__h__'`` and ``'__s__'`` tokens.

        Otherwise ``True`` is returned. Each rejection is logged at debug
        level.
        """
        # Falsy payloads and payloads carrying a 'delete' entry are dropped.
        if not tweet or 'delete' in tweet:
            logger.debug('Empty tweet - skipping')
            return False

        if 'lang' not in tweet or tweet['lang'] != 'en':
            logger.debug('Non EN - skipping')
            return False

        # Any text beginning with 'RT' is treated as a retweet.
        if 'text' not in tweet or tweet['text'].startswith('RT'):
            logger.debug('RE-Tweet found - skipping')
            return False

        # Compare whole tokens, not substrings, hence the split().
        folded_tokens = TwitterMixin.word_map(tweet['text']).split()
        # Both markers present at once (presumably opposite emoticon
        # classes -- verify against word_map) makes the tweet unusable.
        if '__h__' in folded_tokens and '__s__' in folded_tokens:
            logger.debug('Tweet with double emoicons found - skipping')
            return False

        return True
Exemplo n.º 4
0
 def test_word_map(self):
     # word_map output, split on whitespace, must equal this token list:
     # ":)" -> "__h__", ":(" -> "__s__", "not" -> "__not__", and the other
     # words pass through unchanged.
     expected_tokens = "hello __h__ __s__ __not__ xxx __h__".split()
     actual_tokens = TwitterMixin.word_map("hello :) :( not xxx :)").split()
     self.assertEqual(expected_tokens, actual_tokens)
Exemplo n.º 5
0
 def test_word_map(self):
     # word_map output, split on whitespace, must equal this token list:
     # ":)" -> "__h__", ":(" -> "__s__", "not" -> "__not__", and the other
     # words pass through unchanged.
     expected_tokens = "hello __h__ __s__ __not__ xxx __h__".split()
     actual_tokens = TwitterMixin.word_map("hello :) :( not xxx :)").split()
     self.assertEqual(expected_tokens, actual_tokens)