def main():
    """Print the fraction of dev-fold questions that ``recursive_guess`` gets right.

    Loads the questions stored under ``GUESSER_DEV_FOLD``, calls
    ``recursive_guess`` on entry ``0`` of each question's ``text`` (presumably
    the first sentence -- confirm against the dataset) with ``3`` as the second
    argument, and counts a hit whenever the returned guess equals
    ``question.page``. The hit count divided by the number of questions is
    printed to stdout.
    """
    dev_questions = QuizBowlDataset(guesser_train=True).questions_by_fold(
        [GUESSER_DEV_FOLD]
    )[GUESSER_DEV_FOLD]

    # Each comparison contributes 1 on a match and 0 otherwise; tqdm only
    # wraps the iteration to show progress.
    n_correct = sum(
        recursive_guess(q.text[0], 3) == q.page
        for q in tqdm(dev_questions)
    )
    print(n_correct / len(dev_questions))
def main():
    """Evaluate ``recursive_guess`` on the guesser dev fold and print its accuracy.

    For every question in ``GUESSER_DEV_FOLD`` the guess produced from
    ``question.text[0]`` (second argument ``3``) is compared with
    ``question.page``. The number of matches divided by the number of
    questions is written to stdout.
    """
    by_fold = QuizBowlDataset(guesser_train=True).questions_by_fold(
        [GUESSER_DEV_FOLD]
    )
    dev_set = by_fold[GUESSER_DEV_FOLD]

    # One comparison result per question, in dataset order.
    outcomes = [
        recursive_guess(item.text[0], 3) == item.page
        for item in tqdm(dev_set)
    ]
    print(sum(outcomes) / len(dev_set))
def test():
    """Run ``recursive_guess`` on a single dev-fold question and print that question.

    Picks the question at index 10 of the ``GUESSER_DEV_FOLD`` questions, calls
    ``recursive_guess`` on entry ``0`` of its ``text`` with ``k=1``, then prints
    the question's ``page`` followed by that same text entry.
    """
    by_fold = QuizBowlDataset(guesser_train=True).questions_by_fold(
        [GUESSER_DEV_FOLD]
    )
    sample = by_fold[GUESSER_DEV_FOLD][10]

    # NOTE(review): the returned guess is never printed or checked -- confirm
    # whether it was meant to be shown next to the expected page.
    recursive_guess(sample.text[0], k=1)

    print(sample.page)
    print(sample.text[0])
"""Export dev-fold questions from a question database to a JSON file.

Loads the questions stored under ``GUESSER_DEV_FOLD`` from a database
(here ``data/naqt.db``), extracts the qid, text and answer of each one, and
stores the result in ``data/sample_questions.json``.
"""
import json

from qanta.util.constants import GUESSER_DEV_FOLD
from qanta.datasets.quiz_bowl import QuizBowlDataset

dataset = QuizBowlDataset(guesser_train=True, qb_question_db='data/naqt.db')
questions = dataset.questions_by_fold([GUESSER_DEV_FOLD])[GUESSER_DEV_FOLD]


def convert(q):
    """Return a plain dict holding the qid, text and answer of question ``q``.

    ``q.text`` is treated as a mapping: its values are joined with single
    spaces, in the mapping's own iteration order, to form the ``'text'``
    field. ``'qid'`` is taken from ``q.qnum`` and ``'answer'`` from ``q.page``.
    """
    return {
        'qid': q.qnum,
        'text': ' '.join(q.text.values()),
        'answer': q.page,
    }


# Rebind ``questions`` to the converted records that get written out.
questions = [convert(q) for q in questions]

# json.dump escapes non-ASCII characters by default, so the explicit encoding
# only pins down what was previously left to the platform default.
with open('data/sample_questions.json', 'w', encoding='utf-8') as f:
    json.dump(questions, f)