示例#1
0
    def scrap_episode(self, episode, url):
        """Scrape one episode page and attach its embedded videos to a file set.

        Downloads ``url``, sets ``episode.air`` from the page's
        ``fecha-hora`` cell, creates a ``MediaFileSet`` for the episode and
        adds one ``HttpMediaFile`` per ``<embed>`` element whose real URL can
        be resolved through ``self.get_real_url``.

        :param episode: object that receives the ``air`` date and is assigned
            to the new file set. It is not saved here.
        :param url: address of the episode page to download.
        :raises AttributeError: if the page has no ``fecha-hora`` cell
            (``soup.find`` returns ``None``).
        """
        # Close the HTTP response explicitly so the handle is not leaked,
        # even when read() raises.
        response = urllib.urlopen(url)
        try:
            html = response.read()
        finally:
            response.close()

        # Remove processing instructions such as "<?xml ... ?>" before parsing.
        html = re.sub(r'<\?.*?\?>', '', html)
        soup = BeautifulSoup(html, from_encoding='utf8')

        # The cell text is split on '/' and reversed before being passed to
        # date(year, month, day), i.e. it is read as day/month/year.
        day_month_year = soup.find('td', 'fecha-hora').text.split('/')
        episode.air = date(*map(int, reversed(day_month_year)))

        fileset = MediaFileSet()
        fileset.episode = episode
        # NOTE(review): saved before the loop, presumably because
        # ``medias.add`` needs a persisted file set -- confirm.
        fileset.save()

        for cnt, embed in enumerate(soup('embed')):
            # The video id is the last path segment before the query string.
            src = embed.get('src')
            match = re.search(r'/([^/]*?)\?', src) if src else None
            if match is None:
                # An embed without a usable src is skipped instead of
                # aborting the whole scrape with IndexError/TypeError.
                print("ERROR")
                continue

            media = HttpMediaFile()
            media.url = self.get_real_url(match.group(1))
            if media.url is None:
                print("ERROR")
                continue
            # Precedence follows the embed's 1-based position on the page,
            # so skipped embeds leave gaps in the numbering.
            media.precedence = cnt + 1
            print(cnt + 1)
            media.save()
            fileset.medias.add(media)
        fileset.save()