class BagTestCases(unittest.TestCase): """Test bag similarity functions. abydos.distance.Bag """ cmp = Bag() def test_bag_dist_abs(self): """Test abydos.distance.Bag.dist_abs.""" self.assertEqual(self.cmp.dist_abs('', ''), 0) self.assertEqual(self.cmp.dist_abs('nelson', ''), 6) self.assertEqual(self.cmp.dist_abs('', 'neilsen'), 7) self.assertEqual(self.cmp.dist_abs('ab', 'a'), 1) self.assertEqual(self.cmp.dist_abs('ab', 'c'), 2) self.assertEqual(self.cmp.dist_abs('nelson', 'neilsen'), 2) self.assertEqual(self.cmp.dist_abs('neilsen', 'nelson'), 2) self.assertEqual(self.cmp.dist_abs('niall', 'neal'), 2) self.assertEqual(self.cmp.dist_abs('aluminum', 'Catalan'), 5) self.assertEqual(self.cmp.dist_abs('abcdefg', 'hijklm'), 7) self.assertEqual(self.cmp.dist_abs('abcdefg', 'hijklmno'), 8) # Test wrapper self.assertEqual(bag('nelson', 'neilsen'), 2) def test_bag_sim(self): """Test abydos.distance.Bag.sim.""" self.assertEqual(self.cmp.sim('', ''), 1) self.assertEqual(self.cmp.sim('nelson', ''), 0) self.assertEqual(self.cmp.sim('', 'neilsen'), 0) self.assertEqual(self.cmp.sim('ab', 'a'), 0.5) self.assertEqual(self.cmp.sim('ab', 'c'), 0) self.assertAlmostEqual(self.cmp.sim('nelson', 'neilsen'), 5 / 7) self.assertAlmostEqual(self.cmp.sim('neilsen', 'nelson'), 5 / 7) self.assertAlmostEqual(self.cmp.sim('niall', 'neal'), 3 / 5) self.assertAlmostEqual(self.cmp.sim('aluminum', 'Catalan'), 3 / 8) self.assertEqual(self.cmp.sim('abcdefg', 'hijklm'), 0) self.assertEqual(self.cmp.sim('abcdefg', 'hijklmno'), 0) self.assertEqual(Bag(tokenizer=SAPSTokenizer()).sim('DNA', 'RNA'), 0.5) # Test wrapper self.assertAlmostEqual(sim_bag('nelson', 'neilsen'), 5 / 7) def test_bag_dist(self): """Test abydos.distance.Bag.dist.""" self.assertEqual(self.cmp.dist('', ''), 0) self.assertEqual(self.cmp.dist('nelson', ''), 1) self.assertEqual(self.cmp.dist('', 'neilsen'), 1) self.assertEqual(self.cmp.dist('ab', 'a'), 0.5) self.assertEqual(self.cmp.dist('ab', 'c'), 1) self.assertAlmostEqual(self.cmp.dist('nelson', 'neilsen'), 2 / 7) self.assertAlmostEqual(self.cmp.dist('neilsen', 'nelson'), 2 / 7) self.assertAlmostEqual(self.cmp.dist('niall', 'neal'), 2 / 5) self.assertAlmostEqual(self.cmp.dist('aluminum', 'Catalan'), 5 / 8) self.assertEqual(self.cmp.dist('abcdefg', 'hijklm'), 1) self.assertEqual(self.cmp.dist('abcdefg', 'hijklmno'), 1) # Test wrapper self.assertAlmostEqual(dist_bag('nelson', 'neilsen'), 2 / 7)
def test_bag_sim(self): """Test abydos.distance.Bag.sim.""" self.assertEqual(self.cmp.sim('', ''), 1) self.assertEqual(self.cmp.sim('nelson', ''), 0) self.assertEqual(self.cmp.sim('', 'neilsen'), 0) self.assertEqual(self.cmp.sim('ab', 'a'), 0.5) self.assertEqual(self.cmp.sim('ab', 'c'), 0) self.assertAlmostEqual(self.cmp.sim('nelson', 'neilsen'), 5 / 7) self.assertAlmostEqual(self.cmp.sim('neilsen', 'nelson'), 5 / 7) self.assertAlmostEqual(self.cmp.sim('niall', 'neal'), 3 / 5) self.assertAlmostEqual(self.cmp.sim('aluminum', 'Catalan'), 3 / 8) self.assertEqual(self.cmp.sim('abcdefg', 'hijklm'), 0) self.assertEqual(self.cmp.sim('abcdefg', 'hijklmno'), 0) self.assertEqual(Bag(tokenizer=SAPSTokenizer()).sim('DNA', 'RNA'), 0.5)