def test_iop_issueletter(self):
    """Check the bibcode produced for the 'iop_ansnn_issueletter.xml' fixture.

    The fixture is read from ``self.inputdir``, handed to
    ``iop.IOPJATSParser.parse`` as a string, and the resulting record's
    ``'bibcode'`` entry is compared with the expected value.
    """
    xml_path = os.path.join(self.inputdir, 'iop_ansnn_issueletter.xml')
    jats_parser = iop.IOPJATSParser()

    # open_mode_u is defined elsewhere in this module (presumably a
    # text/universal-newline read mode -- confirm at its definition).
    with open(xml_path, open_mode_u) as handle:
        raw_xml = handle.read()

    record = jats_parser.parse(raw_xml)

    # NOTE(review): the 'b' in the page field looks like the issue letter
    # this test is named after -- confirm against the parser.
    self.assertEqual(record['bibcode'], '2021ANSNN..12b5001V')
def test_iop_parser(self):
    """Parse the 'iop_apj.xml' fixture and check bibcode, publication and affiliations.

    The open file object (not its contents) is passed to
    ``iop.IOPJATSParser.parse``. While parsing, ``config.REFERENCE_TOPDIR``
    is pointed at ``'/dev/null/'``; the previous value (or the absence of
    the attribute) is restored afterwards so the override cannot leak into
    tests that run later.
    """
    # NOTE(review): another ``test_iop_parser`` definition appears in this
    # file; if both live in the same class, the later one replaces this one
    # and this test never runs -- confirm and rename one of them if so.
    test_infile = os.path.join(self.inputdir, 'iop_apj.xml')
    parser = iop.IOPJATSParser()

    # Remember the current setting so it can be put back; a private sentinel
    # distinguishes "attribute not set" from any legitimate value.
    unset = object()
    saved_topdir = getattr(config, 'REFERENCE_TOPDIR', unset)
    # presumably keeps the parser from writing reference files to a real
    # directory during the test -- TODO confirm.
    config.REFERENCE_TOPDIR = '/dev/null/'
    try:
        with open(test_infile) as fp:
            test_data = parser.parse(fp)
    finally:
        if saved_topdir is unset:
            del config.REFERENCE_TOPDIR
        else:
            config.REFERENCE_TOPDIR = saved_topdir

    output_bibcode = '2019ApJ...882...74H'
    output_pub = u'The Astrophysical Journal, Volume 882, Issue 2, id.74, <NUMPAGES>13</NUMPAGES> pp.'
    output_aff = [
        u'Department of Physics, The George Washington University, 725 21st St. NW, Washington, DC 20052, USA; The George Washington Astronomy, Physics, and Statistics Institute of Sciences (APSIS), The George Washington University, Washington, DC 20052, USA; Space Sciences Laboratory, 7 Gauss Way, University of California, Berkeley, CA 94720-7450, USA; <id system="ORCID">0000-0002-8548-482X</id>; <email>[email protected]</email>',
        u'Department of Physics, The George Washington University, 725 21st St. NW, Washington, DC 20052, USA; The George Washington Astronomy, Physics, and Statistics Institute of Sciences (APSIS), The George Washington University, Washington, DC 20052, USA; <id system="ORCID">0000-0002-6447-4251</id>',
        u'Department of Astronomy & Astrophysics, Pennsylvania State University, 525 Davey Lab, University Park, PA 16802, USA; <id system="ORCID">0000-0002-7481-5259</id>',
        u'Department of Physics, The George Washington University, 725 21st St. NW, Washington, DC 20052, USA; The George Washington Astronomy, Physics, and Statistics Institute of Sciences (APSIS), The George Washington University, Washington, DC 20052, USA; <id system="ORCID">0000-0001-7833-1043</id>',
    ]

    self.assertEqual(test_data['bibcode'], output_bibcode)
    self.assertEqual(test_data['publication'], output_pub)
    self.assertEqual(test_data['affiliations'], output_aff)
def test_iop_entities(self):
    """Check title, authors and affiliations for the 'iop_aj_accentnames.xml' fixture.

    The fixture text is parsed with ``iop.IOPJATSParser.parse`` using
    ``parser='lxml'``, and the record's ``'title'``, ``'authors'`` and
    ``'affiliations'`` entries are compared with values containing accented
    characters and an unresolved ``&rgr;`` entity.
    """
    xml_path = os.path.join(self.inputdir, 'iop_aj_accentnames.xml')
    jats_parser = iop.IOPJATSParser()
    with open(xml_path, open_mode_u) as handle:
        raw_xml = handle.read()

    # Per the original author's note: earlier IOP/STACKS content was NLM
    # rather than JATS, so this test must request the 'lxml' parser
    # explicitly to override the JATS default 'lxml-xml' (strict) parser.
    # A plain parser.parse(input) call is not used here for that reason.
    record = jats_parser.parse(raw_xml, parser='lxml')

    expected_title = 'Meteoroid Stream of Comet C/1961 T1 (Seki) and Its Relation to the December &rgr;-Virginids and γ-Sagittariids'
    expected_authors = 'Neslušan, Luboš; Hajduková, Mária'
    expected_affiliations = [
        'Astronomical Institute, Slovak Academy of Science, 05960 Tatranská Lomnica, Slovakia; <ID system="ORCID">0000-0001-9758-1144</ID> <EMAIL>[email protected]</EMAIL>',
        'Astronomical Institute, Slovak Academy of Science, Dúbravská cesta 9, 84504 Bratislava, Slovakia; <ID system="ORCID">0000-0002-7837-2627</ID>',
    ]

    self.assertEqual(record['title'], expected_title)
    self.assertEqual(record['authors'], expected_authors)
    self.assertEqual(record['affiliations'], expected_affiliations)
def test_iop_parser(self):
    """Check bibcode, publication and affiliations for the 'iop_apj.xml' fixture.

    The fixture is read from ``self.inputdir`` as text, parsed with
    ``iop.IOPJATSParser.parse``, and three entries of the resulting record
    are compared with their expected values.
    """
    # NOTE(review): another ``test_iop_parser`` definition appears earlier in
    # this file; if both live in the same class, this one replaces it --
    # confirm that is intended.
    xml_path = os.path.join(self.inputdir, 'iop_apj.xml')
    jats_parser = iop.IOPJATSParser()
    with open(xml_path, open_mode_u) as handle:
        raw_xml = handle.read()
    record = jats_parser.parse(raw_xml)

    # Debugging aid (left disabled): save a temporary copy of the data
    # structure next to the fixture.
    # target_saved = test_infile.replace('input','parsed') + '.parsed.NEW'
    # with open(target_saved, 'w') as fp:
    #     json.dump(test_data, fp, sort_keys=True, indent=4)

    expected_bibcode = '2019ApJ...882...74H'
    expected_pub = u'The Astrophysical Journal, Volume 882, Issue 2, id.74, <NUMPAGES>13</NUMPAGES> pp.'
    expected_aff = [
        u'Department of Physics, The George Washington University, 725 21st St. NW, Washington, DC 20052, USA; The George Washington Astronomy, Physics, and Statistics Institute of Sciences (APSIS), The George Washington University, Washington, DC 20052, USA; Space Sciences Laboratory, 7 Gauss Way, University of California, Berkeley, CA 94720-7450, USA; <ID system="ORCID">0000-0002-8548-482X</ID> <EMAIL>[email protected]</EMAIL>',
        u'Department of Physics, The George Washington University, 725 21st St. NW, Washington, DC 20052, USA; The George Washington Astronomy, Physics, and Statistics Institute of Sciences (APSIS), The George Washington University, Washington, DC 20052, USA; <ID system="ORCID">0000-0002-6447-4251</ID>',
        u'Department of Astronomy & Astrophysics, Pennsylvania State University, 525 Davey Lab, University Park, PA 16802, USA; <ID system="ORCID">0000-0002-7481-5259</ID>',
        u'Department of Physics, The George Washington University, 725 21st St. NW, Washington, DC 20052, USA; The George Washington Astronomy, Physics, and Statistics Institute of Sciences (APSIS), The George Washington University, Washington, DC 20052, USA; <ID system="ORCID">0000-0001-7833-1043</ID>',
    ]

    self.assertEqual(record['bibcode'], expected_bibcode)
    self.assertEqual(record['publication'], expected_pub)
    self.assertEqual(record['affiliations'], expected_aff)