Example #1
# Assumed imports (not shown in the original snippet); News, message, and log
# are expected to be provided by the surrounding scraper module.
import sys
import urllib2
from datetime import datetime
from bs4 import BeautifulSoup

def get_news_by_url(url):
    news = News()
    try:
        soup = BeautifulSoup(urllib2.urlopen(url))

        #title
        title = soup.find("div", "pg-story-head md").find("h2").text
        news.set_title(title)

        #postTime
        author_posttime = soup.find("p", "dateline").text.replace("\n","").lower().replace("\t","").split("/")
        post_time = author_posttime[1].replace("pm", "").replace("am", "").strip()
        
        t_format = "%d %b %Y, %I:%M"
        post_time = datetime.strptime(post_time, t_format).isoformat()
        news.set_posttime(post_time)

        #author
        author = author_posttime[0]
        news.set_author(author)

        #url
        news.set_url(url)

        #date
        date = datetime.utcnow().isoformat()
        news.set_date(date)

        #source
        source = 'elfinancierocr'
        news.set_source(source)

        #content, encoding, id, country, labels
        paragraphs = soup.find("div", "pg-story-body mce").find_all('p')
        content = " ".join([unicode(p.text) for p in paragraphs])
        news.set_content(content)

        #encoding
        encoding = 'utf-8'
        news.set_encoding(encoding)

        news.news = message.add_embers_ids(news.news)

        return news.news
    except Exception:
        log.exception("Exception when extracting %s %s" % (url, sys.exc_info()[0]))
        return None
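The dateline parsing above appears to expect text of the form "<author> / <day> <abbreviated month> <year>, <hour>:<minute> am|pm". A minimal sketch of just that step, using a hypothetical dateline value:

from datetime import datetime

dateline = "redaccion / 14 mar 2014, 10:35 am"  # hypothetical dateline text, already lowercased
author, post_time = [part.strip() for part in dateline.split("/")]
post_time = post_time.replace("pm", "").replace("am", "").strip()
print(datetime.strptime(post_time, "%d %b %Y, %I:%M").isoformat())  # -> 2014-03-14T10:35:00

Note that, as in the example, the am/pm marker is stripped before parsing, so the 12-hour %I value is stored as-is.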
Example #2
# Assumed imports (not shown in the original snippet); News, message, and log
# are expected to be provided by the surrounding scraper module.
import sys
import urllib2
from datetime import datetime
from bs4 import BeautifulSoup

def get_news_by_url(url):
    news = News()
    try:
        soup = BeautifulSoup(urllib2.urlopen(url))

        # title
        title = soup.find_all("h1")[0].text
        news.set_title(title)

        # postTime
        post_time = soup.select('meta[name="REVISION_DATE"]')[0]["content"]
        t_format = "%a %b %d %H:%M:%S %Z %Y"
        post_time = datetime.strptime(post_time, t_format).isoformat()
        news.set_posttime(post_time)

        # author
        author = soup.select('meta[name="Author"]')[0]["content"]
        news.set_author(author)

        # url
        news.set_url(url)

        # date
        date = datetime.utcnow().isoformat()
        news.set_date(date)

        # source
        source = "lta_reuters"
        news.set_source(source)

        # content, encoding, id, country, labels
        paragraphs = soup.find(id="resizeableText").find_all("p")
        content = " ".join([unicode(p.text) for p in paragraphs])
        news.set_content(content)

        # encoding
        encoding = "utf-8"
        news.set_encoding(encoding)

        news.news = message.add_embers_ids(news.news)

        return news.news
    except Exception:
        log.exception("Exception when extracting %s %s" % (url, sys.exc_info()[0]))
        return None
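Here the REVISION_DATE meta tag is assumed to carry a value such as "Wed Mar 12 10:35:00 GMT 2014". A minimal sketch of that conversion, with a hypothetical timestamp:

from datetime import datetime

revision_date = "Wed Mar 12 10:35:00 GMT 2014"  # hypothetical meta[name="REVISION_DATE"] content
print(datetime.strptime(revision_date, "%a %b %d %H:%M:%S %Z %Y").isoformat())  # -> 2014-03-12T10:35:00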