Ejemplo n.º 1
0
class BagTestCases(unittest.TestCase):
    """Test bag similarity functions.

    abydos.distance.Bag
    """

    cmp = Bag()

    def test_bag_dist_abs(self):
        """Test abydos.distance.Bag.dist_abs."""
        self.assertEqual(self.cmp.dist_abs('', ''), 0)
        self.assertEqual(self.cmp.dist_abs('nelson', ''), 6)
        self.assertEqual(self.cmp.dist_abs('', 'neilsen'), 7)
        self.assertEqual(self.cmp.dist_abs('ab', 'a'), 1)
        self.assertEqual(self.cmp.dist_abs('ab', 'c'), 2)
        self.assertEqual(self.cmp.dist_abs('nelson', 'neilsen'), 2)
        self.assertEqual(self.cmp.dist_abs('neilsen', 'nelson'), 2)
        self.assertEqual(self.cmp.dist_abs('niall', 'neal'), 2)
        self.assertEqual(self.cmp.dist_abs('aluminum', 'Catalan'), 5)
        self.assertEqual(self.cmp.dist_abs('abcdefg', 'hijklm'), 7)
        self.assertEqual(self.cmp.dist_abs('abcdefg', 'hijklmno'), 8)

        # Test wrapper
        self.assertEqual(bag('nelson', 'neilsen'), 2)

    def test_bag_sim(self):
        """Test abydos.distance.Bag.sim."""
        self.assertEqual(self.cmp.sim('', ''), 1)
        self.assertEqual(self.cmp.sim('nelson', ''), 0)
        self.assertEqual(self.cmp.sim('', 'neilsen'), 0)
        self.assertEqual(self.cmp.sim('ab', 'a'), 0.5)
        self.assertEqual(self.cmp.sim('ab', 'c'), 0)
        self.assertAlmostEqual(self.cmp.sim('nelson', 'neilsen'), 5 / 7)
        self.assertAlmostEqual(self.cmp.sim('neilsen', 'nelson'), 5 / 7)
        self.assertAlmostEqual(self.cmp.sim('niall', 'neal'), 3 / 5)
        self.assertAlmostEqual(self.cmp.sim('aluminum', 'Catalan'), 3 / 8)
        self.assertEqual(self.cmp.sim('abcdefg', 'hijklm'), 0)
        self.assertEqual(self.cmp.sim('abcdefg', 'hijklmno'), 0)

        self.assertEqual(Bag(tokenizer=SAPSTokenizer()).sim('DNA', 'RNA'), 0.5)

        # Test wrapper
        self.assertAlmostEqual(sim_bag('nelson', 'neilsen'), 5 / 7)

    def test_bag_dist(self):
        """Test abydos.distance.Bag.dist."""
        self.assertEqual(self.cmp.dist('', ''), 0)
        self.assertEqual(self.cmp.dist('nelson', ''), 1)
        self.assertEqual(self.cmp.dist('', 'neilsen'), 1)
        self.assertEqual(self.cmp.dist('ab', 'a'), 0.5)
        self.assertEqual(self.cmp.dist('ab', 'c'), 1)
        self.assertAlmostEqual(self.cmp.dist('nelson', 'neilsen'), 2 / 7)
        self.assertAlmostEqual(self.cmp.dist('neilsen', 'nelson'), 2 / 7)
        self.assertAlmostEqual(self.cmp.dist('niall', 'neal'), 2 / 5)
        self.assertAlmostEqual(self.cmp.dist('aluminum', 'Catalan'), 5 / 8)
        self.assertEqual(self.cmp.dist('abcdefg', 'hijklm'), 1)
        self.assertEqual(self.cmp.dist('abcdefg', 'hijklmno'), 1)

        # Test wrapper
        self.assertAlmostEqual(dist_bag('nelson', 'neilsen'), 2 / 7)
Ejemplo n.º 2
0
    def test_bag_sim(self):
        """Test abydos.distance.Bag.sim."""
        self.assertEqual(self.cmp.sim('', ''), 1)
        self.assertEqual(self.cmp.sim('nelson', ''), 0)
        self.assertEqual(self.cmp.sim('', 'neilsen'), 0)
        self.assertEqual(self.cmp.sim('ab', 'a'), 0.5)
        self.assertEqual(self.cmp.sim('ab', 'c'), 0)
        self.assertAlmostEqual(self.cmp.sim('nelson', 'neilsen'), 5 / 7)
        self.assertAlmostEqual(self.cmp.sim('neilsen', 'nelson'), 5 / 7)
        self.assertAlmostEqual(self.cmp.sim('niall', 'neal'), 3 / 5)
        self.assertAlmostEqual(self.cmp.sim('aluminum', 'Catalan'), 3 / 8)
        self.assertEqual(self.cmp.sim('abcdefg', 'hijklm'), 0)
        self.assertEqual(self.cmp.sim('abcdefg', 'hijklmno'), 0)

        self.assertEqual(Bag(tokenizer=SAPSTokenizer()).sim('DNA', 'RNA'), 0.5)