def test_truncate_pagemasters_slugline(self): filename = 'National Top Ten By Volume at Close - March 13.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'PMF' parser = ZCZCPMFParser() self.items = parser.parse(fixture, self.provider) parser.post_process_item(self.items, self.provider) self.assertEqual(self.items.get('slugline'), 'National Top Ten By Volume at ')
def test_greyhound_divs(self): filename = 'Warragul Greyhound NSW TAB DIVS 1-11 Thursday.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'PMF' self.items = ZCZCPMFParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Warragul Greyhound NSW TAB DIVS 1-11 Thursday') self.assertEqual(self.items.get('slugline'), 'Warragul Greys') self.assertEqual(self.items.get('anpa_take_key'), 'NSW TAB DIVS 1-11') self.assertEqual(self.items.get('genre')[0]['name'], 'Results (sport)')
def test_pagemasters_market(self): filename = 'Caulfield RA - Betting - Sat 11 Feb, 2017.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'PMF' parser = ZCZCPMFParser() self.items = parser.parse(fixture, self.provider) parser.post_process_item(self.items, self.provider) self.assertEqual(self.items.get('slugline'), 'Caulfield Market') self.assertEqual(self.items.get('anpa_take_key'), 'Saturday') self.assertEqual(self.items.get('headline'), 'Caulfield Market Saturday')
def test_trot_tab_divs(self): filename = 'Wagga Trot VIC TAB DIVS 1-4 Friday.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'PMF' self.items = ZCZCPMFParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Wagga Trot VIC TAB DIVS 1-4 Friday') self.assertEqual(self.items.get('slugline'), 'Wagga Trot') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'r') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030003') self.assertEqual(self.items.get('genre')[0]['name'], 'Results (sport)')
def test_pagemasters_format(self): filename = 'Darwin GR - Greys - Sun 11 Oct, 2015.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'PMF' self.items = ZCZCPMFParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Darwin Greyhound Fields Sunday') self.assertEqual(self.items.get('slugline'), 'Darwin Grey') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'r') self.assertEqual(self.items.get('subject')[0]['qcode'], '15082000') self.assertEqual(self.items.get('genre')[0]['name'], 'Results (sport)')
def test_medianet_investor_relations_format(self): filename = 'ED_867485_4_2.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'MNET' self.items = ZCZCMedianetParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'IRW News Release: Master Builders Australia')
def test_weights(self): filename = 'viwhtn01_8594.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BRA' self.items = ZCZCRacingParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'STRADBROKE HANDICAP 1400M .=!') self.assertEqual(self.items.get('slugline'), 'STRADBROKE HANDICAP 1400') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'h') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030001')
def test_medianet_format(self): filename = 'ED_841066_2_1.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'MNET' self.items = ZCZCMedianetParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Media Release: Australian Financial Security Authority') self.assertEqual(self.items.get('place')[0], {'qcode': 'FED', 'name': 'FED'}) self.assertEqual(self.items.get('subject')[0]['qcode'], '04000000') self.assertEqual(len(self.items.get('anpa_take_key')), 24)
def test_racing_format_3(self): filename = 'vicomb004_8511.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BRA' self.items = ZCZCRacingParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Eagle Farm MARKET DAY') self.assertEqual(self.items.get('slugline'), 'Eagle Farm MARKET DAY') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'h') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030001')
def test_racing_format(self): filename = 'viflda004_7257.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BRA' self.items = ZCZCRacingParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), ' Racing.Com Park FIELDS Thursday') self.assertEqual(self.items.get('slugline'), ' Racing.Com Park FIELDS ') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'h') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030001')
def test_leading_jockeys(self): filename = 'vinlpt_8390.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BRA' self.items = ZCZCRacingParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Leading jockeys (Sydney)') self.assertEqual(self.items.get('slugline'), 'Leading jockeys (Sydney)') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'h') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030001')
def test_default_format(self): filename = 'Standings__2014_14_635535729050675896.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'SOMETHING' self.items = ZCZCFeedParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'MOTOR: Collated results/standings after Sydney NRMA 500') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'T') self.assertEqual(self.items.get('subject')[0]['qcode'], '15039001') self.assertIn('versioncreated', self.items)
def test_sports_results_preview_format(self): filename = 'AFL_FormGuide__636241349261119029.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'SOMETHING' self.items = ZCZCSportsResultsParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'AFL: AFL Round 23 preview panel') self.assertTrue(self.items.get('body_html').startswith('<p>MELBOURNE, March 3 AAP - Preview of ' 'AFL Round 23 matches (all times AEDT):</p>')) self.assertTrue('<br>Tip:' in self.items.get('body_html'))
def test_racing_format_2(self): filename = 'vifrc7_5254.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BRA' self.items = ZCZCRacingParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Wodonga Comment Saturday races 1-6') self.assertEqual(self.items.get('slugline'), 'Wodonga Comment') self.assertEqual(self.items.get('anpa_take_key'), 'Saturday races 1-6') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'h') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030001')
def test_bob(self): filename = '1487e8f1-f7f5-40f5-8c0f-0eba3c2e162d.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BOB' self.items = ZCZCBOBParser().parse(fixture, self.provider) self.assertEqual(self.items.get('slugline'), 'Legionella_BC1') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'A') self.assertEqual(self.items.get('headline'), 'QLD: Legionella found in Qld hospital') self.assertEqual(self.items.get('anpa_take_key'), '(BRISBANE)') self.assertEqual(self.items.get('subject')[0]['qcode'], '07000000') self.assertTrue(self.items.get('body_html').startswith('<p>Legionella bacteria has been found in a regional'))
def test_bob_empty_header_line(self): filename = '612fa1dc-c476-425d-8c80-d40bdc9cc1d5.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BOB' self.items = ZCZCBOBParser().parse(fixture, self.provider) self.assertEqual(self.items.get('slugline'), 'Legal: Causevic_BC6') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'A') self.assertEqual(self.items.get('headline'), 'Vic: GPS device to come off Vic teen ') self.assertEqual(self.items.get('anpa_take_key'), '(MELBOURNE)') self.assertEqual(self.items.get('subject')[0]['qcode'], '02000000') self.assertTrue(self.items.get('body_html').startswith('<p>A former Melbourne terror suspect no ' 'longer needs to wear')) self.assertEqual(self.items.get('place')[0].get('state'), 'Victoria') self.assertEqual(self.items.get('genre')[0].get('name'), 'Broadcast Script')
class ZCZCTestCase(TestCase): provider = {'name': 'test provder', 'provider': {}} validators = [ { 'schema': { 'headline': { 'required': True, 'maxlength': 64, 'empty': False, 'nullable': False, 'type': "string" }, 'slugline': { 'required': True, 'maxlength': 24, 'empty': False, 'nullable': False, 'type': "string" } }, 'type': 'text', 'act': 'publish', '_id': 'publish_text' }, { 'schema': { 'slugline': { 'required': True, 'maxlength': 30, 'empty': False, 'nullable': False, 'type': "string" } }, 'type': 'text', 'act': 'auto_publish', '_id': 'auto_publish_text' } ] vocab = [{'_id': 'locators', 'items': [{ "name": "VIC", "state": "Victoria", "group": "Australia", "qcode": "VIC", "country": "Australia", "is_active": True, "world_region": "Oceania"}, {"name": "QLD", "qcode": "QLD"}, {"name": "FED", "qcode": "FED"}]}, {'_id': 'genre', 'items': [{ "name": "Broadcast Script", "is_active": True, "qcode": "Broadcast Script"}, { "name": "Results (sport)", "is_active": True, "qcode": "Results (sport)"} ]}] def setUp(self): self.app.data.insert('validators', self.validators) self.app.data.insert('vocabularies', self.vocab) def test_default_format(self): filename = 'Standings__2014_14_635535729050675896.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'SOMETHING' self.items = ZCZCFeedParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'MOTOR: Collated results/standings after Sydney NRMA 500') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'T') self.assertEqual(self.items.get('subject')[0]['qcode'], '15039001') self.assertIn('versioncreated', self.items) def test_sports_results_format(self): filename = 'Standings__2014_14_635535729050675896.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'SOMETHING' self.items = ZCZCSportsResultsParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'MOTOR: Collated results/standings after Sydney NRMA 500') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'T') self.assertEqual(self.items.get('subject')[0]['qcode'], '15039001') self.assertEqual(self.items.get('genre')[0]['qcode'], 'Results (sport)') self.assertIn('versioncreated', self.items) def test_sports_results_preview_format(self): filename = 'AFL_FormGuide__636241349261119029.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'SOMETHING' self.items = ZCZCSportsResultsParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'AFL: AFL Round 23 preview panel') self.assertTrue(self.items.get('body_html').startswith('<p>MELBOURNE, March 3 AAP - Preview of ' 'AFL Round 23 matches (all times AEDT):</p>')) self.assertTrue('<br>Tip:' in self.items.get('body_html')) def test_medianet_format(self): filename = 'ED_841066_2_1.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'MNET' self.items = ZCZCMedianetParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Media Release: Australian Financial Security Authority') self.assertEqual(self.items.get('place')[0], {'qcode': 'FED', 'name': 'FED'}) self.assertEqual(self.items.get('subject')[0]['qcode'], '04000000') self.assertEqual(len(self.items.get('anpa_take_key')), 24) def test_medianet_investor_relations_format(self): filename = 'ED_867485_4_2.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'MNET' self.items = ZCZCMedianetParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'IRW News Release: Master Builders Australia') def test_pagemasters_format(self): filename = 'Darwin GR - Greys - Sun 11 Oct, 2015.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'PMF' self.items = ZCZCPMFParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Darwin Greyhound Fields Sunday') self.assertEqual(self.items.get('slugline'), 'Darwin Grey') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'r') self.assertEqual(self.items.get('subject')[0]['qcode'], '15082000') self.assertEqual(self.items.get('genre')[0]['name'], 'Results (sport)') def test_racing_format(self): filename = 'viflda004_7257.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BRA' self.items = ZCZCRacingParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), ' Racing.Com Park FIELDS Thursday') self.assertEqual(self.items.get('slugline'), ' Racing.Com Park FIELDS ') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'h') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030001') def test_racing_format_2(self): filename = 'vifrc7_5254.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BRA' self.items = ZCZCRacingParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Wodonga Comment Saturday races 1-6') self.assertEqual(self.items.get('slugline'), 'Wodonga Comment') self.assertEqual(self.items.get('anpa_take_key'), 'Saturday races 1-6') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'h') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030001') def test_racing_format_3(self): filename = 'vicomb004_8511.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BRA' self.items = ZCZCRacingParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Eagle Farm MARKET DAY') self.assertEqual(self.items.get('slugline'), 'Eagle Farm MARKET DAY') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'h') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030001') def test_trot_tab_divs(self): filename = 'Wagga Trot VIC TAB DIVS 1-4 Friday.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'PMF' self.items = ZCZCPMFParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Wagga Trot VIC TAB DIVS 1-4 Friday') self.assertEqual(self.items.get('slugline'), 'Wagga Trot') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'r') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030003') self.assertEqual(self.items.get('genre')[0]['name'], 'Results (sport)') def test_leading_jockeys(self): filename = 'vinlpt_8390.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BRA' self.items = ZCZCRacingParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Leading jockeys (Sydney)') self.assertEqual(self.items.get('slugline'), 'Leading jockeys (Sydney)') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'h') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030001') def test_weights(self): filename = 'viwhtn01_8594.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BRA' self.items = ZCZCRacingParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'STRADBROKE HANDICAP 1400M .=!') self.assertEqual(self.items.get('slugline'), 'STRADBROKE HANDICAP 1400') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'h') self.assertEqual(self.items.get('subject')[0]['qcode'], '15030001') def test_bob(self): filename = '1487e8f1-f7f5-40f5-8c0f-0eba3c2e162d.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BOB' self.items = ZCZCBOBParser().parse(fixture, self.provider) self.assertEqual(self.items.get('slugline'), 'Legionella_BC1') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'A') self.assertEqual(self.items.get('headline'), 'QLD: Legionella found in Qld hospital') self.assertEqual(self.items.get('anpa_take_key'), '(BRISBANE)') self.assertEqual(self.items.get('subject')[0]['qcode'], '07000000') self.assertTrue(self.items.get('body_html').startswith('<p>Legionella bacteria has been found in a regional')) def test_bob_empty_header_line(self): filename = '612fa1dc-c476-425d-8c80-d40bdc9cc1d5.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'BOB' self.items = ZCZCBOBParser().parse(fixture, self.provider) self.assertEqual(self.items.get('slugline'), 'Legal: Causevic_BC6') self.assertEqual(self.items.get('anpa_category')[0]['qcode'], 'A') self.assertEqual(self.items.get('headline'), 'Vic: GPS device to come off Vic teen ') self.assertEqual(self.items.get('anpa_take_key'), '(MELBOURNE)') self.assertEqual(self.items.get('subject')[0]['qcode'], '02000000') self.assertTrue(self.items.get('body_html').startswith('<p>A former Melbourne terror suspect no ' 'longer needs to wear')) self.assertEqual(self.items.get('place')[0].get('state'), 'Victoria') self.assertEqual(self.items.get('genre')[0].get('name'), 'Broadcast Script') def test_greyhound_divs(self): filename = 'Warragul Greyhound NSW TAB DIVS 1-11 Thursday.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'PMF' self.items = ZCZCPMFParser().parse(fixture, self.provider) self.assertEqual(self.items.get('headline'), 'Warragul Greyhound NSW TAB DIVS 1-11 Thursday') self.assertEqual(self.items.get('slugline'), 'Warragul Greys') self.assertEqual(self.items.get('anpa_take_key'), 'NSW TAB DIVS 1-11') self.assertEqual(self.items.get('genre')[0]['name'], 'Results (sport)') def test_pagemasters_market(self): filename = 'Caulfield RA - Betting - Sat 11 Feb, 2017.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'PMF' parser = ZCZCPMFParser() self.items = parser.parse(fixture, self.provider) parser.post_process_item(self.items, self.provider) self.assertEqual(self.items.get('slugline'), 'Caulfield Market') self.assertEqual(self.items.get('anpa_take_key'), 'Saturday') self.assertEqual(self.items.get('headline'), 'Caulfield Market Saturday') def test_truncate_pagemasters_slugline(self): filename = 'National Top Ten By Volume at Close - March 13.tst' dirname = os.path.dirname(os.path.realpath(__file__)) fixture = os.path.normpath(os.path.join(dirname, '../fixtures', filename)) self.provider['source'] = 'PMF' parser = ZCZCPMFParser() self.items = parser.parse(fixture, self.provider) parser.post_process_item(self.items, self.provider) self.assertEqual(self.items.get('slugline'), 'National Top Ten By Volume at ')