示例#1
0
def social_news_from_link(ref_link):
    """Fetch the article at ``ref_link`` and store/post it when it is new.

    The article is downloaded with ``NewsPlease.from_url``. Its fields and
    the counters returned by ``util.get_sharedcount_info`` are collected
    into single-element columns, wrapped in a ``Social_News`` object and
    looked up with ``midia_table.check_news``. When the lookup result is
    falsy, the columns are turned into a DataFrame and passed to
    ``midia_lexical.lexical_corpus_and_title``; if the returned categories
    differ from ``[set()]`` the news is saved and posted.

    Args:
        ref_link: Link handed to ``NewsPlease.from_url``.

    Returns:
        None. Nothing is done when ``NewsPlease.from_url`` returns ``None``.
    """
    article = NewsPlease.from_url(ref_link)
    if article is None:
        return

    # The image column holds 0 as a placeholder when the article has no
    # image URL; otherwise it holds whatever download_and_move_image returns.
    image_url = article.image_url
    if image_url is None or image_url == '':
        image = 0
    else:
        image = download_and_move_image(image_url)

    fb_comment, fb_share, fb_reaction, fb_total = util.get_sharedcount_info(article.url)

    # One-element lists so the dict can be turned directly into a one-row
    # DataFrame further down. Key order is kept as in the original layout.
    # NOTE(review): 'abstract' is filled with the full article text, exactly
    # like 'noticia' -- confirm that no shorter summary field was intended.
    row = {
        'titulos': [article.title],
        'links': [article.url],
        'noticia': [article.text],
        'image': [image],
        'abstract': [article.text],
        'date': [str(article.date_publish)],
        'fb_comment': [fb_comment],
        'fb_share': [fb_share],
        'fb_reaction': [fb_reaction],
        'fb_total': [fb_total],
    }

    social_news = Social_News(row['abstract'], row['noticia'], row['date'], row['links'], row['titulos'], row['image'],
                              row['fb_comment'], row['fb_share'], row['fb_reaction'], row['fb_total'])

    try:
        print(row['titulos'])
        news_in_db = midia_table.check_news(social_news)
        print('news_in_db: ' + str(news_in_db))

        if not news_in_db:
            frame = pd.DataFrame(row)
            df, categories = midia_lexical.lexical_corpus_and_title(frame)

            # DB categories and image
            if categories != [set()]:
                social_news.set_categories(categories)
                midia_table.save_news(social_news)
                midia_post.post_news(df)
    except Exception:
        # Best-effort processing: a failing article is reported and skipped.
        # Catching Exception (instead of a bare except) lets KeyboardInterrupt
        # and SystemExit propagate so the process can still be stopped.
        print('Empty News')
示例#2
0
    # NOTE(review): this is a fragment of a larger function -- the enclosing
    # `def` and the creation of `row` and `article` are not visible here.
    # Nothing below runs when `article` is None.
    if (article is not None):
        # Copy the article fields into the row columns. 'abstract' receives
        # the full article text, the same value as 'noticia'.
        row['titulos'].append(article.title)
        row['noticia'].append(article.text)
        row['links'].append(article.url)
        row['abstract'].append(article.text)
        # The publish date is stored as returned by the article object
        # (no string conversion here).
        row['date'].append(article.date_publish)
        path_image = article.image_url
        # Debug output of the image URL.
        print(path_image)
        # 0 is stored as a placeholder when the article has no image URL;
        # otherwise the result of download_and_move_image is stored.
        if path_image == '' or path_image == None:
            row['image'].append(0)
        else:
            row['image'].append(download_and_move_image(article.image_url))
        # Wrap the collected columns in a News object for the table lookup.
        news = News(row['abstract'], row['noticia'], row['date'], row['links'], row['titulos'], row['image'])
        try:
            print(row['titulos'])
            news_in_db = midia_table.check_news(news)
            print('news_in_db: ' + str(news_in_db))
            # Only continue when check_news returned a falsy result.
            if (not news_in_db):
                # `row` is rebound from the dict of columns to a DataFrame.
                row = pd.DataFrame(row)
                df, categories = midia_lexical.lexical_corpus_and_title(row)
                # DB categories: save and post only when the returned
                # categories differ from [set()].
                if (categories != [set()]):
                    news.set_categories(categories)
                    midia_table.save_news(news)
                    midia_post.post_news(df)
        # NOTE(review): a bare `except` catches every exception, including
        # KeyboardInterrupt and SystemExit, and reports all of them as
        # 'Empty News' -- consider narrowing it to `except Exception`.
        except:
            print('Empty News')


# In[ ]: