Beispiel #1
0
def test_gooddoc_badlink():
    """Score a doc whose link is labelled "slides" and expect less than 0.8.

    The document content is read from ``attitudes.txt`` in ``testdir``; the
    link's anchor text and surrounding context both mention slides.
    """
    url = "http://umsu.de/papers/variations.pdf"
    doc = Doc(url=url)

    # Configure the link fully, then attach it to the document.
    link = Link(url=url)
    link.anchortext = "slides"
    link.context = "The slides for my talk"
    doc.link = link

    content_path = os.path.join(testdir, "attitudes.txt")
    doc.content = readfile(content_path)
    doc.numwords = 10200
    doc.numpages = 22
    doc.meta_confidence = 92

    score = paperfilter.evaluate(doc)
    assert score < 0.8
Beispiel #2
0
def test_cv():
    """Score a doc linked as "CV" with ``cv.txt`` content; expect below 0.4."""
    url = "http://umsu.de/papers/cv.pdf"
    doc = Doc(url=url)

    # Anchor text and context are both the bare string "CV".
    link = Link(url=url)
    link.anchortext = "CV"
    link.context = "CV"
    doc.link = link

    content_path = os.path.join(testdir, "cv.txt")
    doc.content = readfile(content_path)
    doc.numwords = 10200
    doc.numpages = 22
    doc.meta_confidence = 92

    score = paperfilter.evaluate(doc)
    assert score < 0.4
Beispiel #3
0
def test_gooddoc():
    """Score a doc with a neutral "Download" link and expect more than 0.98.

    Uses the same URL, ``attitudes.txt`` content and numeric metadata as
    ``test_gooddoc_badlink``; only the link's anchor text and context differ.
    """
    url = "http://umsu.de/papers/variations.pdf"
    doc = Doc(url=url)

    # Configure the link fully, then attach it to the document.
    link = Link(url=url)
    link.anchortext = "Download"
    link.context = "Foo bar"
    doc.link = link

    content_path = os.path.join(testdir, "attitudes.txt")
    doc.content = readfile(content_path)
    doc.numwords = 10200
    doc.numpages = 22
    doc.meta_confidence = 92

    score = paperfilter.evaluate(doc)
    assert score > 0.98