def prepare_document(self, num, language, authors):
    """Build a document through the base reader and fill in this reader's metadata.

    Delegates to ``DocumentReader.prepare_document`` and then copies the
    date, rating, id and title onto the first element of the returned pair.

    Args:
        num: Value stored as the document's ``id``.
        language: Must equal ``self.lang``.
        authors: Forwarded unchanged to the base implementation.

    Returns:
        The two-element result of the base call, with the first element
        updated in place and the second passed through untouched.

    Raises:
        AssertionError: If ``language`` differs from ``self.lang``.
    """
    document, passthrough = DocumentReader.prepare_document(
        self, num, language, authors
    )

    # Copy the date components one by one, in day/month/year order.
    for part in ("day", "month", "year"):
        setattr(document.date, part, self.date_[part])
    document.rating = self.rating

    # NOTE(review): this check runs only after the base call and the writes
    # above, and is skipped entirely when Python runs with -O.
    assert language == self.lang

    document.id = num
    document.title = self.filename_ + "\t" + self.title_
    return document, passthrough
def __init__(self, filename, lang):
    """Create a reader for ``filename`` and parse it immediately.

    Args:
        filename: Stored as ``self.filename`` and passed to
            ``self.parse_from_file``.
        lang: Stored as ``self.lang``.
    """
    # The base initialiser is given an empty string.
    # NOTE(review): the meaning of that argument is not visible here — confirm.
    DocumentReader.__init__(self, "")
    self.filename, self.lang = filename, lang
    # Parsing runs last, after both attributes above have been set.
    self.parse_from_file(filename)