Example #1
0
 def test_reconcile_TIMEX_SET(self):
     s = Timex2XmlDocument('<root>This is some annotated text.</root>')
     t = Timex(type='set')
     t.value = "P6M"
     t.mod = "BEFORE"
     s.reconcile([[('This', 'POS', set()), ('is', 'POS', set()), ('some', 'POS', set([t])), ('annotated', 'POS', set([t])), ('text', 'POS', {t}), ('.', 'POS', set())]])
     self.assertEqual(str(s), xml.dom.minidom.parseString('<root>This is <TIMEX2 PERIODICITY="F6M" MOD="BEFORE" SET="YES">some annotated text</TIMEX2>.</root>').toxml())
Example #2
0
 def test_timex_set_to_sents(self):
     d = Timex2XmlDocument(
         '<root>This is <TIMEX2 PERIODICITY="F3D" SET="YES">a timex</TIMEX2>.</root>'
     )
     s = d.get_sents()
     t = s[0][2][2].pop()
     self.assertEquals(t.type, 'set')
     self.assertEquals(t.value, 'P3D')
Example #3
0
 def test_timex_to_sents(self):
     d = Timex2XmlDocument('<root>This is <TIMEX2 VAL="20100701" MOD="BEFORE" NON_SPECIFIC="YES" GRANUALITY="G1D" COMMENT="Text">a timex</TIMEX2>.</root>')
     s = d.get_sents()
     t = s[0][2][2].pop()
     self.assertEqual(t.type, None)
     self.assertEqual(t.value, '20100701')
     self.assertEqual(t.mod, 'BEFORE')
     self.assertEqual(t.freq, "1D")
     self.assertEqual(t.comment, "Text")
Example #4
0
 def test_reconcile_TIMEX(self):
     s = Timex2XmlDocument('<root>This is some annotated text.</root>')
     t = Timex(type='date')
     t.value = "20100710"
     t.mod = "BEFORE"
     t.freq = "1M"
     t.comment = "Test"
     s.reconcile([[('This', 'POS', set()), ('is', 'POS', set()), ('some', 'POS', {t}), ('annotated', 'POS', {t}), ('text', 'POS', {t}), ('.', 'POS', set())]])
     self.assertEqual(str(s), xml.dom.minidom.parseString('<root>This is <TIMEX2 VAL="20100710" MOD="BEFORE" COMMENT="Test" GRANUALITY="G1M">some annotated text</TIMEX2>.</root>').toxml())
Example #5
0
 def test_strip_timexes(self):
     t = Timex2XmlDocument(
         '<root>This is some <TIMEX2 attr="timex">annotated <TIMEX2>embedded annotated </TIMEX2>text</TIMEX2>.</root>'
     )
     t.strip_timexes()
     self.assertEquals(
         str(t),
         xml.dom.minidom.parseString(
             '<root>This is some annotated embedded annotated text.</root>'
         ).toxml())
Example #6
0
 def test_timex_to_sents_SET(self):
     d = Timex2XmlDocument(
         '<root>This is <TIMEX2 SET="YES">a timex</TIMEX2>.</root>')
     s = d.get_sents()
     t = s[0][2][2].pop()
     self.assertEquals(t.type, 'set')