Python Document_Date_Archive_Url示例

编程语言: Python

命名空间/包名称: osp.dates.models.archive_url

hotexamples.com的示例: 3

Python Document_Date_Archive_Url - 已找到3个示例。这些是从开源项目中提取的、评价最高的 osp.dates.models.archive_url.Document_Date_Archive_Url 真实Python示例。您可以对示例进行评价，以帮助我们提高示例质量。

常用方法

显示/隐藏

select(2)

create(1)

示例#1

显示文件

文件： ext_archive_url.py 项目： overview/osp

def ext_archive_url(doc_id):

    """
    Try to extract an Internet Archive timestamp from the URL.

    Searches the URL of the document's syllabus for a
    `web.archive.org/web/<digits>` segment, parses the digits with
    `date_format`, and writes a row when the parsed date is earlier than
    the current time.

    Args:
        doc_id (int): The document id.

    Returns:
        The value returned by `Document_Date_Archive_Url.create`, or None
        when the URL has no archive timestamp, the timestamp cannot be
        parsed with `date_format`, or the date is not in the past.
    """

    doc = Document.get(Document.id==doc_id)

    # Raw string: `\.`, `\/` and `\d` are regex escapes, not string escapes.
    # A non-raw literal triggers an invalid-escape warning on modern Python.
    match = re.search(
        r'web\.archive\.org\/web\/(?P<timestamp>\d+)',
        doc.syllabus.url
    )

    if not match:
        return None

    try:
        date = datetime.strptime(
            match.group('timestamp'),
            date_format
        )
    except ValueError:
        # The digit run does not fit `date_format` (e.g. a truncated or
        # over-long timestamp); treat it like a URL without a usable date.
        return None

    # Ignore timestamps from the future.
    if date < datetime.now():

        return Document_Date_Archive_Url.create(
            document=doc,
            date=date
        )

    return None

示例#2

显示文件

文件： test_ext_archive_url.py 项目： overview/osp

def test_ignore_regular_url(ext):

    """
    A syllabus scraped from an ordinary (non-archive) URL must not
    produce a row.
    """

    # `ext` is a fixture defined elsewhere; presumably it runs the
    # extractor against a document with the given URL -- TODO confirm.
    ext('http://yale.edu/syllabus.html')

    # The table should still be empty.
    row_count = Document_Date_Archive_Url.select().count()
    assert row_count == 0

示例#3

显示文件

文件： test_ext_archive_url.py 项目： overview/osp

def test_ignore_future_timestamp(ext):

    """
    An archive URL whose timestamp lies in the future must not produce
    a row.
    """

    # Build a timestamp one year ahead of the current time.
    next_year = datetime.now() + relativedelta(years=1)
    stamp = next_year.strftime(date_format)

    # Archive-style URL: prefix + timestamp + '/' + the original page URL.
    archived_url = (
        'https://web.archive.org/web/' + stamp
        + '/' + 'http://yale.edu/syllabus.html'
    )

    # `ext` is a fixture defined elsewhere; presumably it runs the
    # extractor against a document with the given URL -- TODO confirm.
    ext(archived_url)

    # The table should still be empty.
    row_count = Document_Date_Archive_Url.select().count()
    assert row_count == 0