def test_vietnamese(self):
    """Check tokenize_ipa on the Vietnamese fixture pair.

    The value derived from "Vietnamese_input.txt" is tokenized and the
    result must equal the gold value derived from "Vietnamese_output.txt".
    """
    # jipa returns an (input, gold) pair for the two fixture names;
    # presumably it reads them from the test data directory -- confirm
    # against its definition.
    source_text, gold = jipa("Vietnamese_input.txt", "Vietnamese_output.txt")
    tokenizer = Tokenizer()
    result = tokenizer.tokenize_ipa(source_text)
    self.assertEqual(result, gold)
def test_german(self):
    """Check tokenize_ipa on the Zurich German fixture pair.

    The value derived from "Zurich_German_input.txt" is tokenized and the
    result must equal the gold value derived from
    "Zurich_German_output.txt".
    """
    # jipa returns an (input, gold) pair for the two fixture names;
    # presumably it reads them from the test data directory -- confirm
    # against its definition.
    source_text, gold = jipa(
        "Zurich_German_input.txt", "Zurich_German_output.txt"
    )
    tokenizer = Tokenizer()
    result = tokenizer.tokenize_ipa(source_text)
    self.assertEqual(result, gold)
def test_kabiye(self):
    """Check tokenize_ipa on the Kabiye fixture pair.

    The value derived from "Kabiye_input.txt" is tokenized and the result
    must equal the gold value derived from "Kabiye_output.txt".
    """
    # jipa returns an (input, gold) pair for the two fixture names;
    # presumably it reads them from the test data directory -- confirm
    # against its definition.
    source_text, gold = jipa("Kabiye_input.txt", "Kabiye_output.txt")
    tokenizer = Tokenizer()
    result = tokenizer.tokenize_ipa(source_text)
    self.assertEqual(result, gold)
def test_portuguese(self):
    """Check tokenize_ipa on the Brazilian Portuguese fixture pair.

    The value derived from "Brazilian_Portuguese_input.txt" is tokenized
    and the result must equal the gold value derived from
    "Brazilian_Portuguese_output.txt".
    """
    # jipa returns an (input, gold) pair for the two fixture names;
    # presumably it reads them from the test data directory -- confirm
    # against its definition.
    source_text, gold = jipa(
        "Brazilian_Portuguese_input.txt", "Brazilian_Portuguese_output.txt"
    )
    tokenizer = Tokenizer()
    result = tokenizer.tokenize_ipa(source_text)
    self.assertEqual(result, gold)
def test_tokenize_ipa(self):
    """Smoke-test tokenize_ipa on a short string with accented letters.

    The return value is discarded and nothing is asserted, so this test
    fails only if constructing the Tokenizer or the call itself raises.
    """
    Tokenizer().tokenize_ipa("Màttís List")