def test_compare_pq_with_reference_eval(self):
  """Compares `eval_coco_format` PQ results against `panopticapi_eval`.

  Both evaluators are run on the same four inputs located under `_TEST_DIR`
  (ground-truth JSON, prediction JSON, ground-truth folder, prediction
  folder). The test then checks that the result exposes exactly the 'All',
  'Things' and 'Stuff' groups, that each group exposes exactly the 'pq',
  'sq', 'rq' and 'n' entries, and that every entry is almost equal to the
  value reported by the reference evaluator.
  """
  data_root = os.path.join(_TEST_DIR)
  # Positional order expected by both evaluators:
  # (gt_json_file, pred_json_file, gt_folder, pred_folder).
  eval_inputs = [
      os.path.join(data_root, entry)
      for entry in ('coco_gt.json', 'coco_pred.json', 'coco_gt', 'coco_pred')
  ]

  reference = panopticapi_eval.pq_compute(*eval_inputs)
  actual = eval_coco_format.eval_coco_format(
      *eval_inputs,
      metric='pq',
      num_categories=7,
      ignored_label=0,
      max_instances_per_category=256,
      intersection_offset=(256 * 256))

  expected_groups = ['All', 'Things', 'Stuff']
  expected_metrics = ['pq', 'sq', 'rq', 'n']

  self.assertCountEqual(actual.keys(), expected_groups)
  for group in expected_groups:
    group_actual = actual[group]
    self.assertCountEqual(group_actual, expected_metrics)
    # Look up the reference group only after the key check above, so that a
    # malformed result is reported before any reference lookup happens.
    group_reference = reference[group]
    for name in expected_metrics:
      self.assertAlmostEqual(group_actual[name], group_reference[name])