def test_gooddoc_badlink():
    """Check that paper-like content behind a "slides" link scores below 0.8.

    Builds a ``Doc`` whose content is read from the ``attitudes.txt``
    fixture, whose link anchor text is "slides" and whose link context is
    "The slides for my talk", then asserts on ``paperfilter.evaluate``.
    """
    url = "http://umsu.de/papers/variations.pdf"
    doc = Doc(url=url)

    # Link metadata: the anchor text and context both mention slides.
    doc.link = Link(url=url)
    doc.link.anchortext = "slides"
    doc.link.context = "The slides for my talk"

    # Document body and extracted statistics.
    fixture_path = os.path.join(testdir, "attitudes.txt")
    doc.content = readfile(fixture_path)
    doc.numwords = 10200
    doc.numpages = 22
    doc.meta_confidence = 92

    score = paperfilter.evaluate(doc)
    assert score < 0.8
def test_cv():
    """Check that a CV document scores below 0.4 in ``paperfilter.evaluate``.

    Builds a ``Doc`` whose content is read from the ``cv.txt`` fixture and
    whose link anchor text and context are both "CV".
    """
    url = "http://umsu.de/papers/cv.pdf"
    doc = Doc(url=url)

    # Link metadata: anchor text and context are both just "CV".
    doc.link = Link(url=url)
    doc.link.anchortext = "CV"
    doc.link.context = "CV"

    # Document body and extracted statistics.
    fixture_path = os.path.join(testdir, "cv.txt")
    doc.content = readfile(fixture_path)
    doc.numwords = 10200
    doc.numpages = 22
    doc.meta_confidence = 92

    score = paperfilter.evaluate(doc)
    assert score < 0.4
def test_gooddoc():
    """Check that paper-like content behind a neutral link scores above 0.98.

    Builds a ``Doc`` whose content is read from the ``attitudes.txt``
    fixture, with link anchor text "Download" and link context "Foo bar",
    then asserts on ``paperfilter.evaluate``.
    """
    url = "http://umsu.de/papers/variations.pdf"
    doc = Doc(url=url)

    # Link metadata: generic anchor text and context.
    doc.link = Link(url=url)
    doc.link.anchortext = "Download"
    doc.link.context = "Foo bar"

    # Document body and extracted statistics.
    fixture_path = os.path.join(testdir, "attitudes.txt")
    doc.content = readfile(fixture_path)
    doc.numwords = 10200
    doc.numpages = 22
    doc.meta_confidence = 92

    score = paperfilter.evaluate(doc)
    assert score > 0.98