def test_hnews():
    """Check the best links to follow for two saved Hacker News pages.

    Links extracted from the first saved page are loaded, the ``news?p=2``
    link is marked, and links from the second saved page are loaded.  The
    first two entries returned by ``best_links_to_follow()`` must then be
    the ``p=2`` and ``p=3`` URLs, both before and after pruning the
    annotation to at most 100 links.
    """
    page_2 = 'https://news.ycombinator.com/news?p=2'
    page_3 = 'https://news.ycombinator.com/news?p=3'

    link_annotation = page_finder.LinkAnnotation()
    link_annotation.load(
        extract_all_links(get_local_url('Hacker News 1.html')))
    link_annotation.mark_link(page_2)
    link_annotation.load(
        extract_all_links(get_local_url('Hacker News 2.html')))

    best = link_annotation.best_links_to_follow()
    assert best[0] == page_2
    assert best[1] == page_3

    link_annotation.prune(100)
    assert len(link_annotation.links) <= 100

    # Query again after pruning: re-checking the list computed before
    # prune() would pass regardless of which links pruning removed.
    best = link_annotation.best_links_to_follow()
    assert best[0] == page_2
    assert best[1] == page_3
Example #2
0
def test_hnews():
    """Check the best links to follow for two saved Hacker News pages.

    Loads the links of ``Hacker News 1.html``, marks the ``news?p=2`` link,
    then loads the links of ``Hacker News 2.html``.  The first two entries
    returned by ``best_links_to_follow()`` are expected to be the ``p=2``
    and ``p=3`` URLs, and that must still hold once the annotation has been
    pruned to at most 100 links.
    """
    expected_first = 'https://news.ycombinator.com/news?p=2'
    expected_second = 'https://news.ycombinator.com/news?p=3'

    link_annotation = page_finder.LinkAnnotation()
    link_annotation.load(extract_all_links(
        get_local_url('Hacker News 1.html')))
    link_annotation.mark_link(expected_first)
    link_annotation.load(extract_all_links(
        get_local_url('Hacker News 2.html')))

    best = link_annotation.best_links_to_follow()
    assert best[0] == expected_first
    assert best[1] == expected_second

    link_annotation.prune(100)
    assert len(link_annotation.links) <= 100

    # The pre-prune list cannot reflect what prune() did, so ask for the
    # best links again before repeating the checks.
    best = link_annotation.best_links_to_follow()
    assert best[0] == expected_first
    assert best[1] == expected_second
Example #3
0
 def visit(self, page, start=False):
     """Record a visit to ``page`` and feed its links to the annotation.

     The links extracted from ``page`` are loaded into
     ``self.link_annotation`` and ``page`` is added to ``self.visited``.
     Unless ``start`` is true, ``page`` is also passed to
     ``self.link_annotation.mark_link``.
     """
     extracted_links = extract_all_links(page)
     self.link_annotation.load(extracted_links)
     self.visited.add(page)
     if start:
         # The starting page is loaded and recorded but not marked.
         return
     self.link_annotation.mark_link(page)