Python WikiExtractor示例

编程语言: Python

命名空间/包名称: annotated_wikiextractor.wikiextractor

类/类型: WikiExtractor

hotexamples.com的示例: 4

Python WikiExtractor - 共找到4个示例。以下是从开源项目中提取的、评价最高的 annotated_wikiextractor.wikiextractor.WikiExtractor 真实 Python 示例。您可以为示例评分，帮助我们提高示例质量。

常用方法

显示/隐藏

WikiExtractor(1)

extract(1)

示例#1

显示文件

class TestAnnotatedWikiExtractor(unittest.TestCase):
    """Compare extractor output with pre-processed results on disk.

    Both tests read ``resources/singlepage_wikien.txt``, turn it into a
    document with ``extract_document`` and compare the extraction result
    with a file stored under ``resources/``.
    """

    def setUp(self):
        """Create one extractor of each kind for the test about to run."""
        self.annotated_wikiextractor = AnnotatedWikiExtractor()
        self.wikiextractor = WikiExtractor()

    @staticmethod
    def _read_file(path):
        """Return the full text of *path*, closing the file afterwards."""
        with open(path, "r") as handle:
            return handle.read()

    @staticmethod
    def _load_document():
        """Build the input document from the single-page resource file.

        The lines are collected into a real list (not a lazy ``map``
        object) so that the value handed to ``extract_document`` is a list
        on Python 3 as well as on Python 2.
        """
        with open("resources/singlepage_wikien.txt", "r") as handle:
            page = [line.rstrip("\n") for line in handle]
        return annotated_wikiextractor.wikiextractor.extract_document(page)

    def test_extract_original(self):
        """Check ``WikiExtractor.extract`` against singlepage_original.xml.

        Test the extraction process by comparing the result with a
        pre-processed result serialized in the file
        singlepage_original.xml.

        This test targets the script in wikiextractor.py
        """
        wiki_document = self._load_document()
        wiki_document = self.wikiextractor.extract(wiki_document)

        #create test file:
        #open("resources/singlepage_original.xml", "w").write(wiki_document.__str__())

        # Keep the explicit __str__() call so the compared value is exactly
        # the one the test has always compared against the stored file.
        self.assertEqual(
            self._read_file("resources/singlepage_original.xml"),
            wiki_document.__str__())

    def test_extract_annotated(self):
        """Check ``AnnotatedWikiExtractor.extract`` against the JSON file.

        Test the extraction process by comparing the result with a
        pre-processed result serialized in the file
        singlepage_annotated.json.

        This test targets the script in annotated_wikiextractor.py
        """
        wiki_document = self._load_document()
        annotated_wiki_document = self.annotated_wikiextractor.extract(
            wiki_document)

        #create test file:
        #json.dump(json.loads(str(annotated_wiki_document)), open("resources/singlepage_annotated.json", "w"))

        self.assertEqual(
            self._read_file("resources/singlepage_annotated.json"),
            json.dumps(annotated_wiki_document))

示例#2

显示文件

文件： test_annotated_wikiextractor.py 项目： balusamy/Annotated-WikiExtractor

class TestAnnotatedWikiExtractor(unittest.TestCase):
    """Compare the output of both extractors with stored result files.

    Each test reads ``resources/singlepage_wikien.txt``, converts it with
    ``extract_document`` and checks the extraction result against a
    pre-processed file in ``resources/``.
    """

    PAGE_PATH = "resources/singlepage_wikien.txt"

    def setUp(self):
        """Instantiate the annotated and the plain extractor."""
        self.annotated_wikiextractor = AnnotatedWikiExtractor()
        self.wikiextractor = WikiExtractor()

    def _extract_input_document(self):
        """Read the page resource and return the parsed input document.

        A list comprehension is used instead of ``map`` so the lines are a
        concrete list on Python 3 too, and the file is closed by ``with``.
        """
        with open(self.PAGE_PATH, "r") as page_file:
            page = [line.rstrip("\n") for line in page_file]
        return annotated_wikiextractor.wikiextractor.extract_document(page)

    def _expected(self, path):
        """Return the stored expected text from *path* and close the file."""
        with open(path) as expected_file:
            return expected_file.read()

    def test_extract_original(self):
        """Compare ``WikiExtractor.extract`` with singlepage_original.xml.

        Test the extraction process by comparing the result with a
        pre-processed result serialized in the file
        singlepage_original.xml.

        This test targets the script in wikiextractor.py
        """
        wiki_document = self._extract_input_document()
        wiki_document = self.wikiextractor.extract(wiki_document)

        #create test file:
        #open("resources/singlepage_original.xml", "w").write(wiki_document.__str__())

        # __str__() is invoked directly, as before, so the compared operand
        # is unchanged.
        self.assertEqual(self._expected("resources/singlepage_original.xml"), wiki_document.__str__())

    def test_extract_annotated(self):
        """Compare ``AnnotatedWikiExtractor.extract`` with the JSON file.

        Test the extraction process by comparing the result with a
        pre-processed result serialized in the file
        singlepage_annotated.json.

        This test targets the script in annotated_wikiextractor.py
        """
        wiki_document = self._extract_input_document()
        annotated_wiki_document = self.annotated_wikiextractor.extract(wiki_document)

        #create test file:
        #json.dump(json.loads(str(annotated_wiki_document)), open("resources/singlepage_annotated.json", "w"))

        self.assertEqual(self._expected("resources/singlepage_annotated.json"), json.dumps(annotated_wiki_document))

示例#3

显示文件

 def setUp(self):
     """Store one AnnotatedWikiExtractor and one WikiExtractor on the instance."""
     annotated = AnnotatedWikiExtractor()
     self.annotated_wikiextractor = annotated
     plain = WikiExtractor()
     self.wikiextractor = plain

示例#4

显示文件

文件： test_annotated_wikiextractor.py 项目： balusamy/Annotated-WikiExtractor

 def setUp(self):
     """Create both extractor objects and attach them to ``self``."""
     # Construction order is kept: annotated extractor first, then the plain one.
     annotated_extractor = AnnotatedWikiExtractor()
     self.annotated_wikiextractor = annotated_extractor
     plain_extractor = WikiExtractor()
     self.wikiextractor = plain_extractor