def setUpClass(cls):
    """Build the class-level fixtures ``dataset``, ``doc`` and ``dataset2``.

    ``cls.dataset`` holds a single document (also exposed as ``cls.doc``)
    under the key ``'testid'``; it has two parts, each carrying one entity.
    ``cls.dataset2`` holds an empty document under the same ``'testid'`` key
    and a one-part document under ``'newid'``.
    """
    cls.dataset = Dataset()
    cls.doc = Document()
    cls.dataset.documents['testid'] = cls.doc

    # Sketch of the two parts laid out side by side (entity offsets below
    # are relative to the part that owns them):
    # TEXT = "123 45678"
    # POS  = "012345678"
    # ANN1 = " X       "
    # ANN2 = "     XXX "
    # PAR1 = "XXX      "
    # PAR2 = "    XXXXX"
    part1 = Part('123')
    part2 = Part('45678')

    ann1 = Entity(class_id=STUB_ENTITY_CLASS_ID, offset=1, text='2', confidence=0)
    ann2 = Entity(class_id=STUB_ENTITY_CLASS_ID, offset=1, text='567', confidence=1)
    ann1.subclass = 0
    ann2.subclass = 2

    part1.annotations.append(ann1)
    part2.annotations.append(ann2)
    cls.doc.parts['s1h1'] = part1
    cls.doc.parts['s2p1'] = part2

    doc2 = Document()
    # Build the document first and then attach the part.  The previous
    # one-liner `doc3 = Document().parts['someid'] = Part(...)` was a chained
    # assignment, which bound `doc3` to the Part and threw the Document away.
    doc3 = Document()
    doc3.parts['someid'] = Part('marmor stein und eisen')

    cls.dataset2 = Dataset()
    cls.dataset2.documents['newid'] = doc3
    cls.dataset2.documents['testid'] = doc2
def setUpClass(cls):
    """Build ``cls.dataset1``: one document with one annotated part.

    The part receives two entity lists:

    * ``annotations`` - exact, first-of-pair overlap and "missing" entities;
    * ``predicted_annotations`` - the same exact entities, the second-of-pair
      overlap entities and one "spurious" entity.

    Exact entities are the very same objects in both lists.  Each overlap
    pair covers intersecting but different spans.  Missing entities appear
    only in ``annotations``; the spurious one only in
    ``predicted_annotations``.
    """

    def make_entity(class_id, offset, text, subclass):
        # Every fixture entity needs a subclass set after construction.
        entity = Entity(class_id, offset, text)
        entity.subclass = subclass
        return entity

    # create a sample dataset1 (1) to test
    cls.dataset1 = Dataset()
    doc_1 = Document()

    # Nine 4-character groups separated by single spaces, so the group with
    # index k starts at offset 5 * k.
    text = '.... aaaa .... bbbb .... cccc .... dddd .... eeee .... ffff .... gggg .... hhhh .... jjjj'
    part_1 = Part(text)
    cls.dataset1.documents['doc_1'] = doc_1
    doc_1.parts['part_1'] = part_1

    # Present identically in both lists.
    exact_1 = make_entity(STUB_E_ID_1, 5, 'aaaa', 1)
    exact_2 = make_entity(STUB_E_ID_1, 55, 'ffff', 2)
    exact_3 = make_entity(STUB_E_ID_1, 75, 'hhhh', 2)

    # Overlap pairs: `*_1` goes to `annotations`, `*_2` to
    # `predicted_annotations`.
    overlap_1_1 = make_entity(STUB_E_ID_1, 25, 'cccc', 1)
    overlap_1_2 = make_entity(STUB_E_ID_1, 26, 'cc', 1)
    overlap_2_1 = make_entity(STUB_E_ID_1, 32, '.. ddd', 2)
    overlap_2_2 = make_entity(STUB_E_ID_1, 36, 'ddd ...', 2)
    # The third pair also differs in subclass (1 vs 2).
    overlap_3_1 = make_entity(STUB_E_ID_1, 65, 'gggg', 1)
    overlap_3_2 = make_entity(STUB_E_ID_1, 62, '.. gggg ..', 2)

    # Only in `annotations`.
    missing_1 = make_entity('e2', 45, 'eeee', 1)
    # 'jjjj' starts at index 85 of `text`; the former offset 84 pointed at
    # the preceding space and did not match the entity text.
    missing_2 = make_entity('e2', 85, 'jjjj', 1)

    # Only in `predicted_annotations`.
    spurious = make_entity('e2', 15, 'bbbb', 1)

    part_1.annotations = [
        exact_1, exact_2, exact_3,
        overlap_1_1, overlap_2_1, overlap_3_1,
        missing_1, missing_2,
    ]
    part_1.predicted_annotations = [
        exact_1, exact_2, exact_3,
        overlap_1_2, overlap_2_2, overlap_3_2,
        spurious,
    ]