Пример #1
0
 def test_extract_ids(self):
     """Check which tokens ``_extract_ids`` yields for a hand-built tree.

     The tree mixes nodes that list ``SIMPLE_IDENTIFIER`` in ``roles``
     (tokens 1, 3 and 4) with nodes that have no roles at all (token 2
     and the root, token 5). Only the former are expected back, in the
     order 4, 3, 1.
     """
     Node = namedtuple("Node", ("roles", "token", "children"))

     # Leaves first, then the parents that reference them.
     ident_leaf = Node(roles=[SIMPLE_IDENTIFIER], token=1, children=[])
     plain_leaf = Node(roles=[], token=2, children=[])
     ident_parent = Node(
         roles=[SIMPLE_IDENTIFIER], token=3,
         children=[ident_leaf, plain_leaf])
     ident_sibling = Node(roles=[SIMPLE_IDENTIFIER], token=4, children=[])
     tree = Node(roles=[], token=5, children=[ident_parent, ident_sibling])

     extractor = Repo2Coocc(linguist=tests.ENRY, timeout=600)
     found = list(extractor._extract_ids(tree))
     self.assertEqual(found, [4, 3, 1])
Пример #2
0
 def test_obj(self):
     """Convert the directory two levels above this file and check the result.

     The conversion must return a 2-tuple: a collection that contains
     the entry "document", and a square ``coo_matrix`` whose side equals
     the size of that collection and which holds more than 20000 stored
     entries.
     """
     repo_root = os.path.join(os.path.dirname(__file__), "..", "..")
     converter = Repo2Coocc(linguist=tests.ENRY, timeout=600)
     result = converter.convert_repository(repo_root)

     # Validate the container shape before unpacking it.
     self.assertIsInstance(result, tuple)
     self.assertEqual(len(result), 2)
     tokens, matrix = result

     self.assertIn("document", tokens)
     self.assertIsInstance(matrix, coo_matrix)
     side = len(tokens)
     self.assertEqual(matrix.shape, (side, side))
     self.assertGreater(matrix.getnnz(), 20000)
Пример #3
0
    def test_zero_tokens(self):
        """Check the conversion result when UAST traversal does nothing.

        ``_traverse_uast`` is replaced on the instance with a no-op, and
        the converter is then expected to return an empty list together
        with a 0x0 matrix that has no stored entries.
        """
        def skip_uast(root, word2ind, dok_mat):
            # Deliberately leaves word2ind and dok_mat untouched.
            return None

        converter = Repo2Coocc(linguist=tests.ENRY, timeout=600)
        converter._traverse_uast = skip_uast

        repo_root = os.path.join(os.path.dirname(__file__), "..", "..")
        result = converter.convert_repository(repo_root)

        self.assertEqual(result[0], [])
        matrix = result[1]
        self.assertEqual(matrix.shape, (0, 0))
        self.assertEqual(matrix.nnz, 0)
Пример #4
0
 def test_linguist(self):
     """Check that unusable ``linguist`` values raise ``FileNotFoundError``.

     Two values are tried: a name that is not a real path ("xxx") and
     the path of this test module itself.
     """
     # If this test fails, check execution permissions for provided paths.
     for bad_linguist in ("xxx", __file__):
         self.assertRaises(
             FileNotFoundError,
             Repo2Coocc, linguist=bad_linguist, timeout=600)