Example #1
0
    def test_synoname_dist_abs(self):
        """Test abydos.distance.Synoname.dist_abs."""
        # Base cases
        self.assertEqual(self.cmp.dist_abs('', ''), 1)
        self.assertEqual(Synoname(tests=['exact']).dist_abs('', ''), 1)
        self.assertEqual(Synoname(tests=[]).dist_abs('', ''), 13)
        self.assertEqual(
            Synoname(tests=['nonsense-test']).dist_abs('', ''), 13
        )

        # Test input formats
        self.assertEqual(
            self.cmp.dist_abs(
                ('Brueghel II (the Younger)', 'Pieter', 'Workshop of'),
                ('Brueghel II (the Younger)', 'Pieter', 'Workshop of'),
            ),
            1,
        )
        self.assertEqual(
            self.cmp.dist_abs(
                'Brueghel II (the Younger)#Pieter#' + 'Workshop of',
                'Brueghel II (the Younger)#Pieter#' + 'Workshop of',
            ),
            1,
        )
        self.assertEqual(
            self.cmp.dist_abs(
                '22#Brueghel II (the Younger)#Pieter#' + 'Workshop of',
                '44#Brueghel II (the Younger)#Pieter#' + 'Workshop of',
            ),
            1,
        )

        # approx_c tests
        self.assertEqual(
            self.cmp.dist_abs(
                (
                    'Master of Brueghel II (the Younger)',
                    'Pieter',
                    'Workshop of',
                ),
                ('Brueghel I (the Elder)', 'Pieter', 'Workshop of'),
            ),
            13,
        )
        self.assertEqual(
            self.cmp.dist_abs(
                ('Master of Brueghel II', 'Pieter', 'Workshop of'),
                ('Master known as the Brueghel II', 'Pieter', 'Workshop of'),
            ),
            10,
        )
class SynonameTestCases(unittest.TestCase):
    """Test Synoname functions.

    abydos.distance.Synoname
    """

    cmp = Synoname()

    def test_synoname_strip_punct(self):
        """Test abydos.distance.Synoname._synoname_strip_punct."""
        # Base case
        self.assertEqual(self.cmp._synoname_strip_punct(''), '')  # noqa: SF01

        self.assertEqual(
            self.cmp._synoname_strip_punct('abcdefg'), 'abcdefg'  # noqa: SF01
        )
        self.assertEqual(
            self.cmp._synoname_strip_punct("a'b-c,d!e:f%g"),  # noqa: SF01
            'abcdefg',
        )

    def test_synoname_word_approximation(self):
        """Test abydos.distance.Synoname._synoname_word_approximation."""
        # Base case
        self.assertEqual(
            self.cmp._synoname_word_approximation('', ''), 0  # noqa: SF01
        )

        self.assertEqual(
            self.cmp._synoname_word_approximation(  # noqa: SF01
                'di Domenico di Bonaventura',
                'di Tomme di Nuto',
                'Cosimo',
                'Luca',
            ),
            0.4,
        )
        self.assertEqual(
            self.cmp._synoname_word_approximation(  # noqa: SF01
                'Antonello da Messina',
                'Messina',
                '',
                'Antonello da',
                {
                    'gen_conflict': False,
                    'roman_conflict': False,
                    'src_specials': [(35, 'b'), (35, 'c')],
                    'tar_specials': [(35, 'b'), (35, 'c')],
                },
            ),
            0,
        )
        self.assertEqual(
            self.cmp._synoname_word_approximation(  # noqa: SF01
                'louis ii',
                'louis ii',
                'sr jean',
                'sr  pierre',
                {
                    'gen_conflict': False,
                    'roman_conflict': False,
                    'src_specials': [(49, 'b'), (68, 'd'), (121, 'b')],
                    'tar_specials': [(49, 'b'), (68, 'd'), (121, 'b')],
                },
            ),
            0,
        )
        self.assertEqual(
            self.cmp._synoname_word_approximation(  # noqa: SF01
                'louis ii',
                'louis ii',
                'il giovane',
                'sr cadet',
                {
                    'gen_conflict': False,
                    'roman_conflict': False,
                    'src_specials': [
                        (46, 'a'),
                        (49, 'b'),
                        (52, 'a'),
                        (68, 'd'),
                    ],
                    'tar_specials': [
                        (8, 'a'),
                        (49, 'b'),
                        (68, 'd'),
                        (121, 'a'),
                    ],
                },
            ),
            1,
        )
        self.assertAlmostEqual(
            self.cmp._synoname_word_approximation(  # noqa: SF01
                'louis ii',
                'louis ii',
                'ste.-geo ste.',
                'ste.-jo ste.',
                {
                    'gen_conflict': False,
                    'roman_conflict': False,
                    'src_specials': [
                        (49, 'b'),
                        (68, 'd'),
                        (127, 'b'),
                        (127, 'X'),
                    ],
                    'tar_specials': [
                        (49, 'b'),
                        (68, 'd'),
                        (127, 'b'),
                        (127, 'X'),
                    ],
                },
            ),
            2 / 3,
        )
        self.assertAlmostEqual(
            self.cmp._synoname_word_approximation(  # noqa: SF01
                'louis ii',
                'louis',
                'ste.-geo ste.',
                '',
                {
                    'gen_conflict': False,
                    'roman_conflict': False,
                    'src_specials': [
                        (49, 'b'),
                        (68, 'd'),
                        (127, 'b'),
                        (127, 'X'),
                    ],
                    'tar_specials': [],
                },
            ),
            0,
        )
        self.assertAlmostEqual(
            self.cmp._synoname_word_approximation(  # noqa: SF01
                'lou ii', 'louis', 'louis iv', 'ste.', {}
            ),
            0,
        )
        self.assertEqual(
            self.cmp._synoname_word_approximation(  # noqa: SF01
                'ren',
                'loren ste.',
                '',
                '',
                {
                    'tar_specials': [(68, 'd'), (127, 'X')],
                    'src_specials': [(0, '')],
                },
            ),
            1,
        )

    def test_synoname_dist_abs(self):
        """Test abydos.distance.Synoname.dist_abs."""
        # Base cases
        self.assertEqual(self.cmp.dist_abs('', ''), 1)
        self.assertEqual(Synoname(tests=['exact']).dist_abs('', ''), 1)
        self.assertEqual(Synoname(tests=[]).dist_abs('', ''), 13)
        self.assertEqual(
            Synoname(tests=['nonsense-test']).dist_abs('', ''), 13
        )
        self.assertEqual(Synoname(ret_name=True).dist_abs('', ''), 'exact')

        # Test input formats
        self.assertEqual(
            self.cmp.dist_abs(
                ('Brueghel II (the Younger)', 'Pieter', 'Workshop of'),
                ('Brueghel II (the Younger)', 'Pieter', 'Workshop of'),
            ),
            1,
        )
        self.assertEqual(
            self.cmp.dist_abs(
                'Brueghel II (the Younger)#Pieter#' + 'Workshop of',
                'Brueghel II (the Younger)#Pieter#' + 'Workshop of',
            ),
            1,
        )
        self.assertEqual(
            self.cmp.dist_abs(
                '22#Brueghel II (the Younger)#Pieter#' + 'Workshop of',
                '44#Brueghel II (the Younger)#Pieter#' + 'Workshop of',
            ),
            1,
        )

        # approx_c tests
        self.assertEqual(
            self.cmp.dist_abs(
                (
                    'Master of Brueghel II (the Younger)',
                    'Pieter',
                    'Workshop of',
                ),
                ('Brueghel I (the Elder)', 'Pieter', 'Workshop of'),
            ),
            13,
        )
        self.assertEqual(
            self.cmp.dist_abs(
                ('Master of Brueghel II', 'Pieter', 'Workshop of'),
                ('Master known as the Brueghel II', 'Pieter', 'Workshop of'),
            ),
            10,
        )

        # Types 1-12
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Pieter', ''), ('Brueghel', 'Pieter', '')
            ),
            'exact',
        )

        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel II', 'Pieter', ''), ('Brueghel I', 'Pieter', '')
            ),
            'no_match',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Breghel', 'Pieter', ''), ('Brueghel', 'Pieter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Pieter', ''), ('Breghel', 'Pieter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Piter', ''), ('Brueghel', 'Pieter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Pieter', ''), ('Brueghel', 'Piter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brughel', 'Pieter', ''), ('Breghel', 'Pieter', '')
            ),
            'substitution',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Breughel', 'Peter', ''), ('Breughel', 'Piter', '')
            ),
            'substitution',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Pieter', ''), ('Breughel', 'Pieter', '')
            ),
            'transposition',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Peiter', ''), ('Brueghel', 'Pieter', '')
            ),
            'transposition',
        )

        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel:', 'Pieter', ''), ('Brueghel', 'Pi-eter', '')
            ),
            'punctuation',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel,', 'Pieter', ''), ('Brueghel', 'Pieter...', '')
            ),
            'punctuation',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Seu rat', 'George Pierre', ''),
                ('Seu-rat', 'George-Pierre', ''),
            ),
            'punctuation',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Picasso', '', ''), ('Picasso', 'Pablo', '')
            ),
            'no_first',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Pereira', 'I. R.', ''), ('Pereira', 'Irene Rice', '')
            ),
            'initials',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Pereira', 'I.', ''), ('Pereira', 'Irene Rice', '')
            ),
            'initials',
        )
        self.assertNotEqual(
            Synoname(ret_name=True).dist_abs(
                ('Pereira', 'I. R.', ''), ('Pereira', 'I. Smith', '')
            ),
            'initials',
        )
        self.assertNotEqual(
            Synoname(ret_name=True).dist_abs(
                ('Pereira', 'I. R. S.', ''), ('Pereira', 'I. S. R.', '')
            ),
            'initials',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('de Goya', 'Francisco', ''),
                ('de Goya y Lucientes', 'Francisco', ''),
            ),
            'extension',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Seurat', 'George', ''), ('Seurat', 'George-Pierre', '')
            ),
            'extension',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Gericault', 'Theodore', ''),
                ('Gericault', 'Jean Louis Andre Theodore', ''),
            ),
            'inclusion',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Dore', 'Gustave', ''),
                ('Dore', 'Paul Gustave Louis Christophe', ''),
            ),
            'inclusion',
        )

        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Rosetti', 'Dante Gabriel', ''),
                ('Rosetti', 'Gabriel Charles Dante', ''),
            ),
            'word_approx',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('di Domenico di Bonaventura', 'Cosimo', ''),
                ('di Tomme di Nuto', 'Luca', ''),
            ),
            'no_match',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Pereira', 'I. R.', ''), ('Pereira', 'I. Smith', '')
            ),
            'word_approx',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Antonello da Messina', '', ''),
                ('Messina', 'Antonello da', ''),
            ),
            'confusions',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Pietter', ''), ('Bruegghel', 'Pieter', '')
            ),
            'char_approx',
        )

        # Test wrapper
        self.assertEqual(
            synoname(
                ('Master of Brueghel II', 'Pieter', 'Workshop of'),
                ('Master known as the Brueghel II', 'Pieter', 'Workshop of'),
            ),
            10,
        )

    def test_synoname_dist(self):
        """Test abydos.distance.Synoname.dist."""
        # Base cases
        self.assertAlmostEqual(self.cmp.dist('', ''), 1 / 14)
        self.assertAlmostEqual(
            self.cmp.dist(
                '22#Brueghel II (the Younger)#Pieter#' + 'Workshop of',
                '44#Brueghel II (the Younger)#Pieter#' + 'Workshop of',
            ),
            1 / 14,
        )
        self.assertAlmostEqual(
            self.cmp.dist(
                (
                    'Master of Brueghel II (the Younger)',
                    'Pieter',
                    'Workshop of',
                ),
                ('Brueghel I (the Elder)', 'Pieter', 'Workshop of'),
            ),
            13 / 14,
        )
        self.assertAlmostEqual(
            self.cmp.dist(
                ('Master of Brueghel II', 'Pieter', 'Workshop of'),
                ('Master known as the Brueghel II', 'Pieter', 'Workshop of'),
            ),
            10 / 14,
        )

    def test_synoname_sim(self):
        """Test abydos.distance.Synoname.sim."""
        # Base cases
        self.assertAlmostEqual(self.cmp.sim('', ''), 13 / 14)
        self.assertAlmostEqual(
            self.cmp.sim(
                '22#Brueghel II (the Younger)#Pieter#' + 'Workshop of',
                '44#Brueghel II (the Younger)#Pieter#' + 'Workshop of',
            ),
            13 / 14,
        )
        self.assertAlmostEqual(
            self.cmp.sim(
                (
                    'Master of Brueghel II (the Younger)',
                    'Pieter',
                    'Workshop of',
                ),
                ('Brueghel I (the Elder)', 'Pieter', 'Workshop of'),
            ),
            1 / 14,
        )
        self.assertAlmostEqual(
            self.cmp.sim(
                ('Master of Brueghel II', 'Pieter', 'Workshop of'),
                ('Master known as the Brueghel II', 'Pieter', 'Workshop of'),
            ),
            4 / 14,
        )
    def test_synoname_dist_abs(self):
        """Test abydos.distance.Synoname.dist_abs."""
        # Base cases
        self.assertEqual(self.cmp.dist_abs('', ''), 1)
        self.assertEqual(Synoname(tests=['exact']).dist_abs('', ''), 1)
        self.assertEqual(Synoname(tests=[]).dist_abs('', ''), 13)
        self.assertEqual(
            Synoname(tests=['nonsense-test']).dist_abs('', ''), 13
        )
        self.assertEqual(Synoname(ret_name=True).dist_abs('', ''), 'exact')

        # Test input formats
        self.assertEqual(
            self.cmp.dist_abs(
                ('Brueghel II (the Younger)', 'Pieter', 'Workshop of'),
                ('Brueghel II (the Younger)', 'Pieter', 'Workshop of'),
            ),
            1,
        )
        self.assertEqual(
            self.cmp.dist_abs(
                'Brueghel II (the Younger)#Pieter#' + 'Workshop of',
                'Brueghel II (the Younger)#Pieter#' + 'Workshop of',
            ),
            1,
        )
        self.assertEqual(
            self.cmp.dist_abs(
                '22#Brueghel II (the Younger)#Pieter#' + 'Workshop of',
                '44#Brueghel II (the Younger)#Pieter#' + 'Workshop of',
            ),
            1,
        )

        # approx_c tests
        self.assertEqual(
            self.cmp.dist_abs(
                (
                    'Master of Brueghel II (the Younger)',
                    'Pieter',
                    'Workshop of',
                ),
                ('Brueghel I (the Elder)', 'Pieter', 'Workshop of'),
            ),
            13,
        )
        self.assertEqual(
            self.cmp.dist_abs(
                ('Master of Brueghel II', 'Pieter', 'Workshop of'),
                ('Master known as the Brueghel II', 'Pieter', 'Workshop of'),
            ),
            10,
        )

        # Types 1-12
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Pieter', ''), ('Brueghel', 'Pieter', '')
            ),
            'exact',
        )

        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel II', 'Pieter', ''), ('Brueghel I', 'Pieter', '')
            ),
            'no_match',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Breghel', 'Pieter', ''), ('Brueghel', 'Pieter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Pieter', ''), ('Breghel', 'Pieter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Piter', ''), ('Brueghel', 'Pieter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Pieter', ''), ('Brueghel', 'Piter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brughel', 'Pieter', ''), ('Breghel', 'Pieter', '')
            ),
            'substitution',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Breughel', 'Peter', ''), ('Breughel', 'Piter', '')
            ),
            'substitution',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Pieter', ''), ('Breughel', 'Pieter', '')
            ),
            'transposition',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Peiter', ''), ('Brueghel', 'Pieter', '')
            ),
            'transposition',
        )

        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel:', 'Pieter', ''), ('Brueghel', 'Pi-eter', '')
            ),
            'punctuation',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel,', 'Pieter', ''), ('Brueghel', 'Pieter...', '')
            ),
            'punctuation',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Seu rat', 'George Pierre', ''),
                ('Seu-rat', 'George-Pierre', ''),
            ),
            'punctuation',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Picasso', '', ''), ('Picasso', 'Pablo', '')
            ),
            'no_first',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Pereira', 'I. R.', ''), ('Pereira', 'Irene Rice', '')
            ),
            'initials',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Pereira', 'I.', ''), ('Pereira', 'Irene Rice', '')
            ),
            'initials',
        )
        self.assertNotEqual(
            Synoname(ret_name=True).dist_abs(
                ('Pereira', 'I. R.', ''), ('Pereira', 'I. Smith', '')
            ),
            'initials',
        )
        self.assertNotEqual(
            Synoname(ret_name=True).dist_abs(
                ('Pereira', 'I. R. S.', ''), ('Pereira', 'I. S. R.', '')
            ),
            'initials',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('de Goya', 'Francisco', ''),
                ('de Goya y Lucientes', 'Francisco', ''),
            ),
            'extension',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Seurat', 'George', ''), ('Seurat', 'George-Pierre', '')
            ),
            'extension',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Gericault', 'Theodore', ''),
                ('Gericault', 'Jean Louis Andre Theodore', ''),
            ),
            'inclusion',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Dore', 'Gustave', ''),
                ('Dore', 'Paul Gustave Louis Christophe', ''),
            ),
            'inclusion',
        )

        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Rosetti', 'Dante Gabriel', ''),
                ('Rosetti', 'Gabriel Charles Dante', ''),
            ),
            'word_approx',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('di Domenico di Bonaventura', 'Cosimo', ''),
                ('di Tomme di Nuto', 'Luca', ''),
            ),
            'no_match',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Pereira', 'I. R.', ''), ('Pereira', 'I. Smith', '')
            ),
            'word_approx',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Antonello da Messina', '', ''),
                ('Messina', 'Antonello da', ''),
            ),
            'confusions',
        )
        self.assertEqual(
            Synoname(ret_name=True).dist_abs(
                ('Brueghel', 'Pietter', ''), ('Bruegghel', 'Pieter', '')
            ),
            'char_approx',
        )

        # Test wrapper
        self.assertEqual(
            synoname(
                ('Master of Brueghel II', 'Pieter', 'Workshop of'),
                ('Master known as the Brueghel II', 'Pieter', 'Workshop of'),
            ),
            10,
        )
Example #4
0
    def test_synoname_sim_type(self):
        """Test abydos.distance.Synoname.sim_type."""
        self.assertEqual(self.cmp.sim_type('', ''), 1)
        self.assertEqual(Synoname(tests=['exact']).sim_type('', ''), 1)
        self.assertEqual(Synoname(tests=[]).sim_type('', ''), 13)
        self.assertEqual(
            Synoname(tests=['nonsense-test']).sim_type('', ''), 13
        )
        self.assertEqual(Synoname(ret_name=True).sim_type('', ''), 'exact')

        # Types 1-12
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brueghel', 'Pieter', ''), ('Brueghel', 'Pieter', '')
            ),
            'exact',
        )

        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brueghel II', 'Pieter', ''), ('Brueghel I', 'Pieter', '')
            ),
            'no_match',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Breghel', 'Pieter', ''), ('Brueghel', 'Pieter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brueghel', 'Pieter', ''), ('Breghel', 'Pieter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brueghel', 'Piter', ''), ('Brueghel', 'Pieter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brueghel', 'Pieter', ''), ('Brueghel', 'Piter', '')
            ),
            'omission',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brughel', 'Pieter', ''), ('Breghel', 'Pieter', '')
            ),
            'substitution',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Breughel', 'Peter', ''), ('Breughel', 'Piter', '')
            ),
            'substitution',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brueghel', 'Pieter', ''), ('Breughel', 'Pieter', '')
            ),
            'transposition',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brueghel', 'Peiter', ''), ('Brueghel', 'Pieter', '')
            ),
            'transposition',
        )

        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brueghel:', 'Pieter', ''), ('Brueghel', 'Pi-eter', '')
            ),
            'punctuation',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brueghel,', 'Pieter', ''), ('Brueghel', 'Pieter...', '')
            ),
            'punctuation',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Seu rat', 'George Pierre', ''),
                ('Seu-rat', 'George-Pierre', ''),
            ),
            'punctuation',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Picasso', '', ''), ('Picasso', 'Pablo', '')
            ),
            'no_first',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Pereira', 'I. R.', ''), ('Pereira', 'Irene Rice', '')
            ),
            'initials',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Pereira', 'I.', ''), ('Pereira', 'Irene Rice', '')
            ),
            'initials',
        )
        self.assertNotEqual(
            Synoname(ret_name=True).sim_type(
                ('Pereira', 'I. R.', ''), ('Pereira', 'I. Smith', '')
            ),
            'initials',
        )
        self.assertNotEqual(
            Synoname(ret_name=True).sim_type(
                ('Pereira', 'I. R. S.', ''), ('Pereira', 'I. S. R.', '')
            ),
            'initials',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('de Goya', 'Francisco', ''),
                ('de Goya y Lucientes', 'Francisco', ''),
            ),
            'extension',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Seurat', 'George', ''), ('Seurat', 'George-Pierre', '')
            ),
            'extension',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Gericault', 'Theodore', ''),
                ('Gericault', 'Jean Louis Andre Theodore', ''),
            ),
            'inclusion',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Dore', 'Gustave', ''),
                ('Dore', 'Paul Gustave Louis Christophe', ''),
            ),
            'inclusion',
        )

        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Rosetti', 'Dante Gabriel', ''),
                ('Rosetti', 'Gabriel Charles Dante', ''),
            ),
            'word_approx',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('di Domenico di Bonaventura', 'Cosimo', ''),
                ('di Tomme di Nuto', 'Luca', ''),
            ),
            'no_match',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Pereira', 'I. R.', ''), ('Pereira', 'I. Smith', '')
            ),
            'word_approx',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Antonello da Messina', '', ''),
                ('Messina', 'Antonello da', ''),
            ),
            'confusions',
        )
        self.assertEqual(
            Synoname(ret_name=True).sim_type(
                ('Brueghel', 'Pietter', ''), ('Bruegghel', 'Pieter', '')
            ),
            'char_approx',
        )