Python Article.top_imageの例

プログラミング言語: Python

名前空間/パッケージ名: newspaper

クラス/型: Article

メソッド/関数: top_image

hotexamples.comのコード掲載数: 3

Python Article.top_image - 3件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのnewspaper.Article.top_imageの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示/非表示

Article(30)

nlp(30)

set_html(30)

parse(30)

download(30)

build(20)

html(15)

text(11)

download_state(9)

fetch_images(6)

is_valid_url(6)

publish_date(5)

authors(5)

is_downloaded(5)

title(4)

top_image(3)

article_html(3)

keywords(3)

set_text(2)

images(2)

has_top_image(2)

is_valid_body(2)

summary(1)

summarylen(1)

split(1)

set_top_img_no_check(1)

tag(1)

set_title(1)

tags(1)

textlen(1)

set_meta_data(1)

lower(1)

set_keywords(1)

save(1)

prepareSentenceHighlights(1)

nlpEntropy(1)

meta_data(1)

append(1)

is_video(1)

is_parsed(1)

is_media_news(1)

has_video(1)

get_is_news(1)

format_top_node(1)

category_urls(1)

articles(1)

url(1)

コード例 #1

ファイルを表示

def test_convert_to_dict_most_fields_works():
    """Check which requested keys ``extractor.to_dict`` returns for an Article.

    Five attributes are assigned on the article before conversion; the test
    then requests eleven keys and expects exactly seven of them in the result.
    """
    fake = Faker()

    article = Article(url=fake.url())

    article.authors = [fake.name() for _ in range(2)]
    article.top_image = fake.image_url()
    article.article_html = fake.text()
    article.images = [fake.image_url() for _ in range(2)]
    article.meta_data = [fake.city(), fake.state(), fake.country()]

    # Each requested key paired with whether it must appear in the result.
    expectations = (
        ("article_html", True),
        ("authors", True),
        ("images", True),
        ("keywords", False),
        ("meta_data", True),
        ("source_url", True),
        ("summary", False),
        ("top_image", True),
        ("url", True),
        ("tags", False),
        ("meta_favicon", False),
    )
    requested = [key for key, _ in expectations]

    converted = extractor.to_dict(article, *requested)

    assert converted
    assert len(converted) == 7

    for key, should_be_present in expectations:
        assert (key in converted) is should_be_present

コード例 #2

ファイルを表示

ファイル: server.py プロジェクト: arjun11verma/OctoDash

def getArticleInfo():
    """Collect basic metadata for the news articles of the requested country.

    The request body is decoded as UTF-8 and parsed with ``literal_eval``; it
    must evaluate to a mapping containing a ``"country"`` key. Each URL
    returned by ``getNewsUrls(country)`` is downloaded and parsed, and the
    articles that succeed are recorded.

    Returns:
        dict: maps consecutive integers starting at 0 to dicts with the keys
        ``"authors"``, ``"date"``, ``"url"``, ``"imageURL"`` and ``"title"``.
        URLs that fail to download/parse, or that repeat the previously
        recorded URL, are skipped.
    """
    post_data = literal_eval(request.data.decode('utf8'))
    country = post_data["country"]
    articleInfo = {}
    goodCount = 0
    for url in getNewsUrls(country):
        # Skip a URL identical to the last recorded one before paying for a
        # download; the original raised a bare Exception for this after parsing.
        if goodCount != 0 and url == articleInfo[goodCount - 1]["url"]:
            print("Inside if statement")
            print("bad article")
            continue

        article = Article(url)
        # Best-effort boundary: any failure on a single article is logged and
        # the loop moves on to the next URL.
        try:
            article.download()
            article.parse()

            date = article.publish_date
            if isinstance(date, datetime):
                date = date.strftime('%m/%d/%Y')
            elif date is None:
                date = "No Date"

            # Keep only names made of exactly two space-separated parts.
            authors = [name for name in article.authors
                       if len(name.split(" ")) == 2]
            if not authors:
                # The original assigned authors[0] on an empty list, which
                # raised IndexError and discarded the whole article.
                authors = ["No Author"]

            image_url = article.top_image
            if image_url is None:
                image_url = "No imageURL"

            title = article.title
            if title is None:
                title = "No title"

            articleInfo[goodCount] = {
                "authors": authors,
                "date": date,
                "url": url,
                "imageURL": image_url,
                "title": title
            }
            goodCount += 1
        except Exception as e:
            print(e)
            print("bad article")
    return articleInfo

コード例 #3

ファイルを表示

# Setup (run these in a shell, not inside the Python interpreter):
#   pip install nltk
#   pip install newspaper3k

import nltk
from newspaper import Article

url = 'https://www.cnbc.com/2020/03/19/ecb-launches-new-820-billion-coronavirus-package.html'
article = Article(url)

# Fetch and parse the page, then run the NLP step; the 'punkt' tokenizer data
# is downloaded before article.nlp() is called.
article.download()
article.parse()
nltk.download('punkt')
article.nlp()

# get the authors
print(article.authors)

# get the publish date (an attribute, not a method -- calling it raises TypeError)
print(article.publish_date)

# get the top image URL (also an attribute, not a method)
print(article.top_image)

# get the full article text
print(article.text)

# get summary of the article
print(article.summary)