def test_language(self): def _check_lang(sample): blob = self.blob(sample['path']) assert blob.language, 'No language for %s' % sample['path'] assert sample['language'] == blob.language.name, blob.name Samples.each(_check_lang)
def test_classify_ambiguous_languages(self): def classify_ambiguous_languages(sample): language = Language.find_by_name(sample['language']) languages = Language.find_by_filename(sample['path']) languages_names = [x.name for x in languages] results = Classifier.classify(DATA, open(sample['path']).read(), languages_names) self.assertEqual(language.name, results[0][0]) samples = Samples() samples.generate() samples.each(classify_ambiguous_languages)