def print_progress(self):
    """Print the running extractor statistics to stdout.

    Six lines are written, in this order:

    * the average tf-idf figure, computed as one minus
      ``sum_tfidf / queries_asked``;
    * the average n-gram perplexity, ``sum_ngp / sentences_asked``;
    * the average edit distance, ``sum_edit / queries_asked``;
    * the share of sentences accepted by the tf-idf, n-gram-perplexity and
      edit-distance extractors (each ``accepted_by_* / sentences_asked``),
      rendered with ``Formatter.percent``.

    A figure whose denominator is still zero is printed as ``n/a`` instead
    of raising ``ZeroDivisionError``, so the method is safe to call before
    any query or sentence has been counted.
    """
    not_available = "n/a"
    queries = self.queries_asked
    sentences = self.sentences_asked

    # Averages taken over the number of queries.
    if queries:
        avg_tfidf = str(1 - self.sum_tfidf / queries)
        avg_edit = str(self.sum_edit / queries)
    else:
        avg_tfidf = avg_edit = not_available

    # Average and accept rates taken over the number of sentences.
    if sentences:
        avg_ngp = str(self.sum_ngp / sentences)
        rate_tfidf = Formatter.percent(self.accepted_by_tfidf / sentences)
        rate_ngp = Formatter.percent(self.accepted_by_ngp / sentences)
        rate_edit = Formatter.percent(
            self.accepted_by_edit_distance / sentences
        )
    else:
        avg_ngp = rate_tfidf = rate_ngp = rate_edit = not_available

    print("Average tfidf: " + avg_tfidf)
    print("Average ngram-perplexity: " + avg_ngp)
    print("Average edit-distance: " + avg_edit)
    print("Accept percent by tfidf extractor: " + rate_tfidf)
    print("Accept percent by ngram-perplexity extractor: " + rate_ngp)
    print("Accept percent by edit-distance extractor: " + rate_edit)
def print_progress_summary(self):
    """Print the general-corpora line counters and accept rate to stdout.

    Five lines are written: ``scanned_lines``, ``assigned_lines``, the
    number of assigned lines that were usable
    (``assigned_lines - unusable_lines``), ``extracted_lines``, and the
    accept rate ``extracted_lines / usable`` rendered with
    ``Formatter.percent``.

    When the usable-line count is zero the accept rate is printed as
    ``n/a`` instead of raising ``ZeroDivisionError``.
    """
    prefix = "(General corpora): "
    useful_lines = self.assigned_lines - self.unusable_lines

    # The rate is undefined while no usable line has been seen.
    if useful_lines != 0:
        accept_rate = Formatter.percent(self.extracted_lines / useful_lines)
    else:
        accept_rate = "n/a"

    print(prefix + "Total lines scanned : " + str(self.scanned_lines))
    print(prefix + "Lines assigned to worker: " + str(self.assigned_lines))
    print(prefix + "Lines containing words: " + str(useful_lines))
    print(prefix + "Extracted lines: " + str(self.extracted_lines))
    print(prefix + "Sentence accept rate: " + accept_rate)