Exemplo n.º 1
0
class TextGetter:
    """Pick post titles from a subreddit's "new" listing.

    A title is skipped when it contains an entry from the bad-word file,
    mentions 'r/showerthoughts', or is already present in ``self._seen``.
    """

    def __init__(self, reddit, subreddit='showerthoughts', badlist='bad-words.txt'):
        """Store the configuration used by :meth:`get_text`.

        Args:
            reddit: Client object; ``get_text`` calls
                ``reddit.get_subreddit(name).get_new()`` on it.
            subreddit: Name of the subreddit to read titles from.
            badlist: Path to a text file with one unwanted substring per
                line. A falsy value or a missing file disables filtering.
        """
        self.reddit = reddit
        self.subreddit = subreddit
        self.badlist = badlist
        self.logger = logging.getLogger('reddit')
        # Titles already handed out; DroppingSet is defined elsewhere.
        self._seen = DroppingSet(50)

    def get_text(self):
        """Return the first acceptable title that has not been seen yet.

        Returns:
            The title string (also added to ``self._seen``), or None when
            the listing is exhausted without an acceptable title.
        """
        bad_words = self.get_bad_words()
        subs = self.reddit.get_subreddit(self.subreddit).get_new()
        for submission in subs:
            text = submission.title
            lower_text = text.lower()
            # First bad word contained in the title, if any.
            matched = next((bad for bad in bad_words if bad in lower_text), None)
            if matched is not None:
                self.logger.debug('Rejecting text because matched "{}" in "{}"'.format(matched, text))
                continue
            if text in self._seen or 'r/showerthoughts' in lower_text:
                continue
            self._seen.add(text)
            return text
        return None

    def get_bad_words(self):
        """Load the bad-word list as lower-case substrings.

        Blank and whitespace-only lines are dropped: an empty string is a
        substring of every title and would cause every title to be rejected.
        Entries are lower-cased because they are compared against the
        lower-cased title. Surrounding whitespace of non-blank entries is
        kept as written in the file.

        Returns:
            A list of strings; empty when ``self.badlist`` is falsy or does
            not name an existing file.
        """
        if not (self.badlist and os.path.isfile(self.badlist)):
            return []
        with open(self.badlist) as fh:
            return [line.lower() for line in fh.read().splitlines() if line.strip()]
Exemplo n.º 2
0
 def test_add_discard(self):
     """Added values are members; discarding one leaves the other in place."""
     dropping = DroppingSet(10)
     for value in (4, 3):
         dropping.add(value)
     self.assertIn(4, dropping)
     self.assertIn(3, dropping)
     dropping.discard(4)
     self.assertNotIn(4, dropping)
     self.assertIn(3, dropping)
Exemplo n.º 3
0
class ImageGetter:
    """Download an image from a subreddit's new posts to a local file.

    Candidate URLs come from each submission's ``preview`` data and must
    pass a size limit (``IMG_MAX_SIZE``) and an aspect-ratio check.
    """

    def __init__(self, reddit, subreddit='earthporn', aspect_ratio=1.6):
        """Store the configuration used by :meth:`get_image`.

        Args:
            reddit: Client object; ``get_image`` calls
                ``reddit.get_subreddit(name).get_new(limit=50)`` on it.
            subreddit: Name of the subreddit to take images from.
            aspect_ratio: Desired width/height ratio; an image is accepted
                when its ratio differs from this by less than 1.0.
        """
        self.reddit = reddit
        self.subreddit = subreddit
        self.aspect_ratio = aspect_ratio
        self.logger = logging.getLogger('reddit')
        # URLs already used; DroppingSet is defined elsewhere.
        self._seen = DroppingSet(50)

    def get_image(self, path):
        """Download a suitable image and write it to ``path``.

        Walks the new submissions until one yields an acceptable URL that is
        not in ``self._seen``. If the listing runs out first, one of the
        previously seen URLs is reused at random.

        Args:
            path: Destination file path; opened in binary write mode.

        Returns:
            ``path`` when the image was written, or None when no candidate
            URL exists or the download did not answer with HTTP 200.
        """
        try:
            subs = self.reddit.get_subreddit(self.subreddit).get_new(limit=50)
            url = self._get_image_url(subs)
            while url is None or url in self._seen:
                if url is not None:
                    self.logger.debug('Already seen!')
                url = self._get_image_url(subs)
            self._seen.add(url)
        except StopIteration:
            # _get_image_url signals an exhausted listing with StopIteration.
            if not self._seen:
                self.logger.debug('Could not find any suitable images :(')
                return None
            num_seen = len(self._seen)
            msg = 'Did not find a suitable image; reusing one of {} seen before.'
            self.logger.debug(msg.format(num_seen))
            # random.choice needs an indexable sequence; copying to a list
            # works whether DroppingSet is indexable or only iterable.
            url = random.choice(list(self._seen))
        response = requests.get(url, stream=True)
        try:
            if response.status_code != 200:
                # Nothing was written, so do not report ``path`` as valid.
                self.logger.debug('Download of "{}" failed with status {}'.format(
                    url, response.status_code))
                return None
            # Let the raw stream undo any transfer content-encoding.
            response.raw.decode_content = True
            with open(path, 'wb') as wfh:
                shutil.copyfileobj(response.raw, wfh)
        finally:
            # A streamed response holds its connection until closed.
            response.close()
        return path

    def _get_image_url(self, subs):
        """Return an acceptable image URL from the next submission, or None.

        Args:
            subs: Iterator of submissions; exactly one item is consumed.

        Returns:
            The URL of the first preview image that passes the size and
            aspect-ratio checks, or None when the submission has no preview
            or no image qualifies.

        Raises:
            StopIteration: When ``subs`` is exhausted; ``get_image`` relies
                on this to detect the end of the listing.
        """
        next_sub = next(subs)
        preview = getattr(next_sub, 'preview', None)
        if not preview:
            return None
        for image in preview.get('images', []):
            source = image['source']
            self.logger.debug('found "{}" {}x{}'.format(source['url'],
                                                        source['width'], source['height']))
            # Normalise once so the size and ratio checks use the same values.
            width = int(source['width'])
            height = int(source['height'])
            if width <= 0 or height <= 0:
                # Guards the division below against a zero height.
                self.logger.debug('invalid dimensions!')
                continue
            if width > IMG_MAX_SIZE or height > IMG_MAX_SIZE:
                self.logger.debug('too large!')
                continue
            image_aspect_ratio = width / float(height)
            if abs(self.aspect_ratio - image_aspect_ratio) < 1.0:
                return source['url']
            self.logger.debug('Wrong aspect ratio! {:.2f}'.format(image_aspect_ratio))
        return None
Exemplo n.º 4
0
 def test_max(self):
     """With DroppingSet(4), a fifth add removes 1 and a sixth removes 2."""
     dropping = DroppingSet(4)
     for value in range(1, 5):
         dropping.add(value)
     self.assertIn(1, dropping)
     self.assertIn(4, dropping)
     dropping.add(5)
     self.assertNotIn(1, dropping)
     for kept in (2, 4, 5):
         self.assertIn(kept, dropping)
     dropping.add(6)
     self.assertNotIn(2, dropping)
Exemplo n.º 5
0
 def test_order(self):
     """pop() hands values back in reverse order of insertion."""
     inserted = (4, 3, 42)
     dropping = DroppingSet(10)
     for value in inserted:
         dropping.add(value)
     for expected in reversed(inserted):
         self.assertEqual(dropping.pop(), expected)
Exemplo n.º 6
0
 def test_max(self):
     """Check which values remain after adding a fifth and sixth item to DroppingSet(4)."""
     bounded = DroppingSet(4)
     for item in (1, 2, 3, 4):
         bounded.add(item)
     # All four initial values fit; spot-check the first and last.
     self.assertIn(1, bounded)
     self.assertIn(4, bounded)
     # A fifth value removes 1 but keeps the rest.
     bounded.add(5)
     self.assertNotIn(1, bounded)
     self.assertIn(2, bounded)
     self.assertIn(4, bounded)
     self.assertIn(5, bounded)
     # A sixth value removes 2.
     bounded.add(6)
     self.assertNotIn(2, bounded)
Exemplo n.º 7
0
 def test_order(self):
     """Values added as 4, 3, 42 are popped as 42, 3, 4."""
     stack_like = DroppingSet(10)
     for item in (4, 3, 42):
         stack_like.add(item)
     first_out = stack_like.pop()
     self.assertEqual(first_out, 42)
     second_out = stack_like.pop()
     self.assertEqual(second_out, 3)
     third_out = stack_like.pop()
     self.assertEqual(third_out, 4)
Exemplo n.º 8
0
 def test_add_discard(self):
     """discard() removes only the given value from the set."""
     members = DroppingSet(10)
     members.add(4)
     members.add(3)
     # Both values are present after being added.
     for present in (4, 3):
         self.assertIn(present, members)
     members.discard(4)
     # Only the discarded value is gone.
     self.assertNotIn(4, members)
     self.assertIn(3, members)
Exemplo n.º 9
0
 def __init__(self, reddit, subreddit='showerthoughts', badlist='bad-words.txt'):
     """Keep the reddit client, subreddit name and bad-word file path.

     Also attaches the 'reddit' logger and creates ``self._seen`` as a
     DroppingSet(50).
     """
     self._seen = DroppingSet(50)
     self.logger = logging.getLogger('reddit')
     self.reddit, self.subreddit, self.badlist = reddit, subreddit, badlist
Exemplo n.º 10
0
 def __init__(self, reddit, subreddit='earthporn', aspect_ratio=1.6):
     """Keep the reddit client, subreddit name and target aspect ratio.

     Also attaches the 'reddit' logger and creates ``self._seen`` as a
     DroppingSet(50).
     """
     self._seen = DroppingSet(50)
     self.logger = logging.getLogger('reddit')
     self.reddit, self.subreddit, self.aspect_ratio = reddit, subreddit, aspect_ratio