Esempio n. 1
0
 def test_filter_datasets_by_language(self):
     """Filter datasets by one language, then by two, and check the tags.

     Only the first returned dataset is inspected in each case.
     """
     _api = HfApi()

     # Case 1: a single language given as a plain string.
     f = DatasetFilter(languages="en")
     # list() keeps len()/indexing valid even if list_datasets hands back
     # a lazy iterable rather than a list (depends on the library version).
     datasets = list(_api.list_datasets(filter=f))
     self.assertGreater(len(datasets), 0)
     # assertIn reports the missing tag and the actual tags on failure.
     self.assertIn("languages:en", datasets[0].tags)

     # Case 2: several languages given as a tuple taken from the
     # DatasetSearchArguments helper.
     args = DatasetSearchArguments()
     f = DatasetFilter(languages=(args.languages.en, args.languages.fr))
     datasets = list(_api.list_datasets(filter=f))
     self.assertGreater(len(datasets), 0)
     self.assertIn("languages:en", datasets[0].tags)
     self.assertIn("languages:fr", datasets[0].tags)
Esempio n. 2
0
 def test_filter_datasets_by_task_ids(self):
     """Filter datasets by task id and check the first result's tags."""
     _api = HfApi()
     f = DatasetFilter(task_ids="automatic-speech-recognition")
     # list() keeps len()/indexing valid even if list_datasets hands back
     # a lazy iterable rather than a list (depends on the library version).
     datasets = list(_api.list_datasets(filter=f))
     self.assertGreater(len(datasets), 0)
     # assertIn reports the missing tag and the actual tags on failure.
     self.assertIn(
         "task_ids:automatic-speech-recognition", datasets[0].tags)
Esempio n. 3
0
 def test_filter_datasets_by_task_categories(self):
     """Filter datasets by task category and check the first result's tags."""
     _api = HfApi()
     f = DatasetFilter(task_categories="audio-classification")
     # list() keeps len()/indexing valid even if list_datasets hands back
     # a lazy iterable rather than a list (depends on the library version).
     datasets = list(_api.list_datasets(filter=f))
     self.assertGreater(len(datasets), 0)
     # assertIn reports the missing tag and the actual tags on failure.
     self.assertIn(
         "task_categories:audio-classification", datasets[0].tags)
Esempio n. 4
0
 def test_filter_datasets_by_author_and_name(self):
     """Filter by author plus dataset name and expect exactly one match."""
     _api = HfApi()
     f = DatasetFilter(author="huggingface",
                       dataset_name="DataMeasurementsFiles")
     # list() keeps len()/indexing valid even if list_datasets hands back
     # a lazy iterable rather than a list (depends on the library version).
     datasets = list(_api.list_datasets(filter=f))
     self.assertEqual(len(datasets), 1)
     # Substring checks: assertIn shows both operands when they fail.
     self.assertIn("huggingface", datasets[0].author)
     self.assertIn("DataMeasurementsFiles", datasets[0].id)
Esempio n. 5
0
 def test_filter_datasets_by_size_categories(self):
     """Filter datasets by size category and check the first result's tags."""
     _api = HfApi()
     f = DatasetFilter(size_categories="100K<n<1M")
     # list() keeps len()/indexing valid even if list_datasets hands back
     # a lazy iterable rather than a list (depends on the library version).
     datasets = list(_api.list_datasets(filter=f))
     self.assertGreater(len(datasets), 0)
     # assertIn reports the missing tag and the actual tags on failure.
     self.assertIn("size_categories:100K<n<1M", datasets[0].tags)
Esempio n. 6
0
 def test_filter_datasets_by_multilinguality(self):
     """Filter datasets by multilinguality and check the first result's tags."""
     _api = HfApi()
     f = DatasetFilter(multilinguality="yes")
     # list() keeps len()/indexing valid even if list_datasets hands back
     # a lazy iterable rather than a list (depends on the library version).
     datasets = list(_api.list_datasets(filter=f))
     self.assertGreater(len(datasets), 0)
     # assertIn reports the missing tag and the actual tags on failure.
     self.assertIn("multilinguality:yes", datasets[0].tags)
Esempio n. 7
0
 def test_filter_datasets_by_language_creator(self):
     """Filter datasets by language creator and check the first result's tags."""
     _api = HfApi()
     f = DatasetFilter(language_creators="crowdsourced")
     # list() keeps len()/indexing valid even if list_datasets hands back
     # a lazy iterable rather than a list (depends on the library version).
     datasets = list(_api.list_datasets(filter=f))
     self.assertGreater(len(datasets), 0)
     # assertIn reports the missing tag and the actual tags on failure.
     self.assertIn("language_creators:crowdsourced", datasets[0].tags)
Esempio n. 8
0
 def test_filter_datasets_by_benchmark(self):
     """Filter datasets by benchmark and check the first result's tags."""
     _api = HfApi()
     f = DatasetFilter(benchmark="raft")
     # list() keeps len()/indexing valid even if list_datasets hands back
     # a lazy iterable rather than a list (depends on the library version).
     datasets = list(_api.list_datasets(filter=f))
     self.assertGreater(len(datasets), 0)
     # assertIn reports the missing tag and the actual tags on failure.
     self.assertIn("benchmark:raft", datasets[0].tags)