def test_get_inner_xml(self):
    """Check get_inner_xml on one element and on the whole document."""
    # Expected result for the first <Foo> element of the test document.
    expected_foo_content = (
        "some text"
        " <Bar name=\"a\">Bar A</Bar>"
        " <Bar name=\"b\">Bar B</Bar>"
    )
    foo_element = self.document.getElementsByTagName('Foo')[0]
    self.assertEqual(get_inner_xml(foo_element), expected_foo_content)

    # Applied to the document node itself, the result must equal sample_xml.
    self.assertEqual(get_inner_xml(self.document), sample_xml)
def _get_title(self):
    """Extract the title, subtitle and title footnote ids of the document.

    The first ``article-title`` element of ``self.document`` is used.
    Every ``xref`` descendant of it whose ``ref-type`` attribute is ``fn``
    is detached from the tree and its ``rid`` attribute is collected.

    Returns:
        A 3-tuple ``(title, subtitle, notes)`` where ``title`` is
        ``get_inner_xml`` of the title element (after the footnote
        references were removed), ``subtitle`` is
        ``get_value_in_tag(self.document, 'subtitle')`` and ``notes`` is
        the list of collected ``rid`` values.

        If there is no ``article-title`` element, or anything goes wrong
        while processing it, a message is written to stderr and
        ``('', '', [])`` is returned, so the result can always be
        unpacked and ``notes`` is always a list.
    """
    try:
        tag = next(
            iter(self.document.getElementsByTagName('article-title')), None)
        if tag is None:
            # Route the "no title at all" case through the same
            # best-effort handler instead of silently returning None.
            raise LookupError('no article-title element')

        notes = []
        for note in tag.getElementsByTagName('xref'):
            if note.getAttribute('ref-type') == 'fn':
                # getElementsByTagName yields all descendants, so the xref
                # may be nested inside inline markup; it has to be removed
                # from its real parent, not from the title element.
                note.parentNode.removeChild(note)
                notes.append(note.getAttribute('rid'))
        subtitle = get_value_in_tag(self.document, 'subtitle')
        return get_inner_xml(tag), subtitle, notes
    except Exception:
        # Deliberate best effort: a broken title must not abort the caller.
        print("Can't find title", file=sys.stderr)
        return '', '', []
def _get_title(self):
    """Extract the title, subtitle and title footnote ids of the document.

    The first ``article-title`` element of ``self.document`` is used.
    Every ``xref`` descendant of it whose ``ref-type`` attribute is ``fn``
    is detached from the tree and its ``rid`` attribute is collected.

    Returns:
        A 3-tuple ``(title, subtitle, notes)`` where ``title`` is
        ``get_inner_xml`` of the title element (after the footnote
        references were removed), ``subtitle`` is
        ``get_value_in_tag(self.document, 'subtitle')`` and ``notes`` is
        the list of collected ``rid`` values.

        If there is no ``article-title`` element, or anything goes wrong
        while processing it, a message is written to stderr and
        ``('', '', [])`` is returned, so the result can always be
        unpacked and ``notes`` is always a list.
    """
    try:
        tag = next(
            iter(self.document.getElementsByTagName('article-title')), None)
        if tag is None:
            # Route the "no title at all" case through the same
            # best-effort handler instead of silently returning None.
            raise LookupError('no article-title element')

        notes = []
        for note in tag.getElementsByTagName('xref'):
            if note.getAttribute('ref-type') == 'fn':
                # getElementsByTagName yields all descendants, so the xref
                # may be nested inside inline markup; it has to be removed
                # from its real parent, not from the title element.
                note.parentNode.removeChild(note)
                notes.append(note.getAttribute('rid'))
        subtitle = get_value_in_tag(self.document, 'subtitle')
        return get_inner_xml(tag), subtitle, notes
    except Exception:
        # Deliberate best effort: a broken title must not abort the caller.
        print("Can't find title", file=sys.stderr)
        return '', '', []
def _get_abstract(self):
    """Return get_inner_xml of the first ``abstract`` element.

    Only the first ``abstract`` element found in ``self.document`` is
    considered. When the document has none, ``None`` is returned.
    """
    first_abstract = next(
        iter(self.document.getElementsByTagName('abstract')), None)
    if first_abstract is None:
        return None
    return get_inner_xml(first_abstract)