示例#1
0
    def test_list_url_format(self):
        """Check that at least one listed download has the expected URL shape.

        An entry qualifies when its first item (the URL) contains both
        'pages-articles' and 'xml-p' and does not contain 'multistream'.
        """
        def has_expected_format(entry):
            # The URL is stored as the first item of each entry.
            link = entry[0]
            if 'pages-articles' not in link:
                return False
            if 'xml-p' not in link:
                return False
            return 'multistream' not in link

        downloads = get_list_downloads_wikidump(dump_url=get_wikidump_url())
        # Evaluate every entry, then require a non-empty set of matches.
        matching = list(filter(has_expected_format, downloads))
        assert matching
示例#2
0
 def test_unicity_list_url(self):
     """Check that no URL appears more than once in the download list."""
     downloads = get_list_downloads_wikidump(dump_url=get_wikidump_url())
     # The URL is the first item of each entry.
     links = [entry[0] for entry in downloads]
     # Deduplicating must not shrink the collection.
     assert len(set(links)) == len(links)
示例#3
0
 def test_format_date_wikidump_url(self):
     """Check the second-to-last path component of the dump URL.

     That component must be exactly eight characters long and consist
     only of digits (presumably a YYYYMMDD date; confirm against
     get_wikidump_url).
     """
     segments = get_wikidump_url().split('/')
     date_part = segments[-2]
     assert len(date_part) == 8
     assert date_part.isdigit()
示例#4
0
 def test_get_list_downloads_wikidump(self):
     """Check that the download list for the dump URL is non-empty (truthy)."""
     downloads = get_list_downloads_wikidump(dump_url=get_wikidump_url())
     assert downloads
示例#5
0
 def test_get_wikidump_url(self):
     """Check that the dump URL contains the English Wikipedia dumps base."""
     expected_base = "https://dumps.wikimedia.org/enwiki/"
     resolved_url = get_wikidump_url()
     assert expected_base in resolved_url