def __init__(self, corrections=None, spoken=None, target=None):
    """Populate the instance with paths, datasets, counters and a helper.

    The three arguments are forwarded positionally, unchanged, to
    ``CorrectionHelper``; each defaults to ``None``.

    Attributes set on ``self``:
        train_path, dev_path, test_path: the three values from ``filepaths()``.
        trainset, devset, testset: the three values from ``returnDatasets()``.
        languages_known, languages_learning: two separate empty ``Counter``s.
        languages: the result of ``languages()``.
        ch: the ``CorrectionHelper`` built from the constructor arguments.
    """
    # Each helper is called in the same order as before; the result is
    # unpacked immediately so the attribute assignment order is unchanged.
    path_triple = filepaths()
    self.train_path, self.dev_path, self.test_path = path_triple

    dataset_triple = returnDatasets()
    self.trainset, self.devset, self.testset = dataset_triple

    # Two distinct Counter objects -- they must not share state.
    self.languages_known, self.languages_learning = Counter(), Counter()

    self.languages = languages()

    helper = CorrectionHelper(corrections, spoken, target)
    self.ch = helper
class DataCleaner:
    """Bundle dataset paths, datasets, language counters and a correction helper.

    The instance is a thin facade: ``astrip`` delegates to ``asciistrip`` and
    ``cleanCorrections`` delegates to the ``CorrectionHelper`` stored in
    ``self.ch``.
    """

    def __init__(self, corrections=None, spoken=None, target=None):
        """Set up paths, datasets, counters and the correction helper.

        ``corrections``, ``spoken`` and ``target`` are passed positionally,
        unchanged, to ``CorrectionHelper``; each defaults to ``None``.
        """
        # filepaths() and returnDatasets() each yield three values, which are
        # unpacked into the train/dev/test attributes in that order.
        located_paths = filepaths()
        self.train_path, self.dev_path, self.test_path = located_paths

        loaded_sets = returnDatasets()
        self.trainset, self.devset, self.testset = loaded_sets

        # Independent, initially empty tallies.
        self.languages_known = Counter()
        self.languages_learning = Counter()

        self.languages = languages()
        self.ch = CorrectionHelper(corrections, spoken, target)

    def astrip(self, string):
        """Return ``asciistrip(string)``; no instance state is consulted."""
        stripped = asciistrip(string)
        return stripped

    def cleanCorrections(self):
        """Return whatever ``self.ch.extractAndCleanCorrections()`` returns."""
        correction_helper = self.ch
        return correction_helper.extractAndCleanCorrections()