コード例 #1
0
ファイル: test_fs.py プロジェクト: becxer/pytrain
    def test_fs_csv_loader(self):
        sample_data = "sample_data/iris/iris.csv"
        self.tlog("loading matrix => " + sample_data)

        dmat_train, dlabel_train, dmat_test, dlabel_test \
            = fs.csv_loader(sample_data, 0.2)

        self.tlog('iris train data size : ' + str(len(dmat_train)))
        self.tlog('iris test data size : ' + str(len(dmat_test)))

        self.set_global_value('iris_mat_train', dmat_train)
        self.set_global_value('iris_label_train', dlabel_train)
        self.set_global_value('iris_mat_test', dmat_test)
        self.set_global_value('iris_label_test', dlabel_test)
コード例 #2
0
    def test_fs_csv_loader(self):
        sample_data = "sample_data/iris/iris.csv"
        self.tlog("loading matrix => " + sample_data)

        dmat_train, dlabel_train, dmat_test, dlabel_test \
            = fs.csv_loader(sample_data, 0.2)

        self.tlog('iris train data size : ' + str(len(dmat_train)))
        self.tlog('iris test data size : ' + str(len(dmat_test)))

        self.set_global_value('iris_mat_train', dmat_train)
        self.set_global_value('iris_label_train', dlabel_train)
        self.set_global_value('iris_mat_test', dmat_test)
        self.set_global_value('iris_label_test', dlabel_test)
コード例 #3
0
def load_mnist(path=".", dataset="training", one_hot=False):
    data_path = download_data(path, "mnist")
    train_data = os.path.join(data_path, "MNIST_train.small.csv")
    dmat_train, dlabel_train = fs.csv_loader(train_data, 0)
    test_data = os.path.join(data_path, "MNIST_test.small.csv")
    dmat_test, dlabel_test = fs.csv_loader(test_data, 0)
    dmat_train = map(lambda row: map(float, row), dmat_train)
    dmat_test = map(lambda row: map(float, row), dmat_test)
    if one_hot:
        one_hot_label = map(list, list(np.eye(10)))
        temp_dlabel_train = []
        temp_dlabel_test = []
        for l in dlabel_train:
            temp_dlabel_train.append(one_hot_label[int(l)])
        for l in dlabel_test:
            temp_dlabel_test.append(one_hot_label[int(l)])
        dlabel_train = temp_dlabel_train
        dlabel_test = temp_dlabel_test
    if dataset == "training":
        return dmat_train, dlabel_train
    elif dataset == "testing":
        return dmat_test, dlabel_test
    else:
        raise ValueError("dataset must be 'testing' or 'training'")
コード例 #4
0
ファイル: dataset.py プロジェクト: becxer/pytrain
def load_iris(path=".", dataset="training", one_hot = False):
    data_path = download_data(path, "iris")
    sample_data = os.path.join(data_path, "iris.csv")    
    dmat_train, dlabel_train, dmat_test, dlabel_test \
      = fs.csv_loader(sample_data, 0.2)
    if one_hot:
        one_hot_label = [[1,0,0], [0,1,0], [0,0,1]]
        temp_dlabel_train = []
        temp_dlabel_test = []
        for l in dlabel_train:
            temp_dlabel_train.append(one_hot_label[int(l)])
        for l in dlabel_test:
            temp_dlabel_test.append(one_hot_label[int(l)])
        dlabel_train = temp_dlabel_train
        dlabel_test = temp_dlabel_test
    if dataset == "training":
        return dmat_train, dlabel_train
    elif dataset == "testing":
        return dmat_test, dlabel_test
    else:
        raise ValueError("dataset must be 'testing' or 'training'")
コード例 #5
0
def load_iris(path=".", dataset="training", one_hot=False):
    data_path = download_data(path, "iris")
    sample_data = os.path.join(data_path, "iris.csv")
    dmat_train, dlabel_train, dmat_test, dlabel_test \
      = fs.csv_loader(sample_data, 0.2)
    dmat_train = map(lambda row: map(float, row), dmat_train)
    dmat_test = map(lambda row: map(float, row), dmat_test)
    if one_hot:
        one_hot_label = map(list, list(np.eye(3)))
        temp_dlabel_train = []
        temp_dlabel_test = []
        for l in dlabel_train:
            temp_dlabel_train.append(one_hot_label[int(l)])
        for l in dlabel_test:
            temp_dlabel_test.append(one_hot_label[int(l)])
        dlabel_train = temp_dlabel_train
        dlabel_test = temp_dlabel_test
    if dataset == "training":
        return dmat_train, dlabel_train
    elif dataset == "testing":
        return dmat_test, dlabel_test
    else:
        raise ValueError("dataset must be 'testing' or 'training'")