def test_matrix_row_to_lists(self):
    """Converting only the first row must match the head of the full conversion.

    The first row of the dense matrix is converted on its own (wrapped
    with ``np.atleast_2d`` before being passed in) and the resulting lists
    are compared with the first ``sum(row)`` entries of the lists obtained
    from the whole matrix.
    """
    matrix = self.dtm
    first_row = matrix[0]
    n_first = sum(first_row)
    full_ws, full_ds = utils.matrix_to_lists(matrix)
    row_ws, row_ds = utils.matrix_to_lists(np.atleast_2d(first_row))
    for from_row, from_full in ((row_ws, full_ws), (row_ds, full_ds)):
        np.testing.assert_array_equal(from_row, from_full[:n_first])
def test_matrix_row_to_lists_sparse(self):
    """Sparse variant: first-row conversion must match the head of the full one.

    Row 0 of ``self.dtm_sparse`` is converted on its own and compared with
    the first ``row.sum()`` entries of the lists produced from the whole
    sparse matrix.
    """
    sparse = self.dtm_sparse
    first_row = sparse[0]
    n_first = first_row.sum()
    full_ws, full_ds = utils.matrix_to_lists(sparse)
    row_ws, row_ds = utils.matrix_to_lists(first_row)
    for from_row, from_full in ((row_ws, full_ws), (row_ds, full_ds)):
        np.testing.assert_array_equal(from_row, from_full[:n_first])
def test_matrix_rows_to_lists_sparse(self):
    """Sparse variant: converting rows 0-1 must match the head of the full result.

    The slice ``dtm[0:2]`` is converted on its own and compared with the
    first ``rows.sum()`` entries of the lists produced from the whole
    sparse matrix.
    """
    sparse = self.dtm_sparse
    leading_rows = sparse[0:2]
    n_leading = leading_rows.sum()
    full_ws, full_ds = utils.matrix_to_lists(sparse)
    part_ws, part_ds = utils.matrix_to_lists(leading_rows)
    for from_part, from_full in ((part_ws, full_ws), (part_ds, full_ds)):
        np.testing.assert_array_equal(from_part, from_full[:n_leading])
def test_matrix_to_lists(self):
    """Check the basic invariants of ``utils.matrix_to_lists`` on ``self.dtm``.

    Verifies that:

    * both returned lists have length ``D * N_WORDS_PER_DOC`` and equal
      length to each other;
    * the largest value in ``DS`` / ``WS`` plus one reproduces the number
      of rows / columns of the matrix;
    * ``DS`` is already in sorted order;
    * the per-value counts of ``DS`` and ``WS`` equal the fixture totals
      ``N_BY_D`` and ``N_BY_W``.
    """
    dtm, D, N_WORDS_PER_DOC = self.dtm, self.D, self.N_WORDS_PER_DOC
    N_BY_D, N_BY_W = self.N_BY_D, self.N_BY_W
    WS, DS = utils.matrix_to_lists(dtm)

    self.assertEqual(len(WS), D * N_WORDS_PER_DOC)
    self.assertEqual(len(WS), len(DS))
    self.assertEqual(dtm.shape, (max(DS) + 1, max(WS) + 1))

    # Use numpy's array assertions (as the sibling tests do) rather than
    # assertTrue(np.all(a == b)): they report the mismatching elements,
    # reject shape mismatches instead of broadcasting, and do not depend
    # on DS being an ndarray for the elementwise comparison.
    np.testing.assert_array_equal(DS, sorted(DS))
    np.testing.assert_array_equal(np.bincount(DS), N_BY_D)
    np.testing.assert_array_equal(np.bincount(WS), N_BY_W)
def test_lists_to_matrix(self):
    """Round-trip ``self.dtm`` through ``matrix_to_lists`` / ``lists_to_matrix``.

    The matrix rebuilt from the lists must equal the original matrix.
    """
    dtm = self.dtm
    WS, DS = utils.matrix_to_lists(dtm)
    dtm_new = utils.lists_to_matrix(WS, DS)
    # assert_array_equal fails on a shape mismatch (np.all(a == b) could
    # broadcast and pass) and prints the differing entries on failure.
    np.testing.assert_array_equal(dtm, dtm_new)