Python DataLoader.clean_data 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: data_loader

클래스/타입: DataLoader

메소드/함수: clean_data

hotexamples.com에서의 예제들: 3

Python DataLoader.clean_data - 3개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python data_loader.DataLoader.clean_data의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제의 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

DataLoader(30)

create_batches(9)

convert_df_to_arrays(4)

gen_data(4)

convert_to_char(4)

data_iterator(4)

generate(3)

batch_unpack_image_sequence(3)

_write_nifti(3)

getHistoryRange(3)

change_file(3)

fetch_batch(3)

data_generator(3)

clean_data(3)

create_tf_dataset(3)

_load_file(2)

create_random_ordering(2)

create_dataset(2)

data_batch(2)

createRecoData(2)

add_dataset(2)

convert_sentence_to_indices(2)

astype(2)

generator(2)

getFeatures(2)

build_vocab(2)

build_data(2)

filter_by_nodes(2)

gen(1)

format_file_list(1)

form_sentences(1)

filter_multicolor(1)

filter_latest_questions(1)

fetch_val_batch(1)

gen_batch_data(1)

arrange_data(1)

_make_dataset(1)

gen_iterator(1)

gen_tfrecords(1)

generate_positive_samples(1)

generate_train_data(1)

generate_train_test(1)

getAllHistory(1)

getAllPersons(1)

getBatch(1)

getData(1)

getFuture(1)

getSetLen(1)

load_order_list(1)

fetch_train_batch(1)

예제 #1

파일 보기

class Experiment:
    """Drive one load / clean / train / score cycle.

    The constructor creates a ``DataLoader`` and a ``Trainer``; ``run`` uses
    them to process the 'train' and 'test' sets and prints a score for each.
    """

    def __init__(self):
        # The loader is created first, pointed at the fixed '/data' location.
        self.data_loader = DataLoader('/data')
        self.trainer = Trainer()

    def run(self):
        """Load both sets, clean them, fit on 'train' and print both scores."""
        loader = self.data_loader
        model = self.trainer

        # Both sets are loaded before either one is cleaned.
        x_train, y_train = loader.load_set('train')
        x_test, y_test = loader.load_set('test')

        x_train = loader.clean_data(x_train)
        x_test = loader.clean_data(x_test)

        # Only the cleaned training set is used for fitting.
        model.train(x_train, y_train)

        pred_train = model.predict(x_train)
        pred_test = model.predict(x_test)

        # Each score is computed right before its line is printed,
        # train first and test second.
        report = (
            ('Train accuracy: ', y_train, pred_train),
            ('Test accuracy: ', y_test, pred_test),
        )
        for caption, truth, guess in report:
            print(caption, self.compute_score(truth, guess))

    def compute_score(self, labels, predictions):
        """Return ``metrics.accuracy_score(labels, predictions)``.

        NOTE(review): ``metrics`` is imported outside this snippet; it is
        presumably ``sklearn.metrics`` -- confirm against the full file.
        """
        score = metrics.accuracy_score(labels, predictions)
        return score

예제 #2

파일 보기

    method and compares them
'''
#%%
# Read the data:
# The loader is built from a dataset name and a file extension; the loaded
# table is accessed through ``data.df`` below.
# NOTE(review): ``data.df`` is presumably a pandas DataFrame -- confirm.
data = DataLoader(dataset_name='trade_selection', extension='csv')
# Row position at 80% of the first dimension of ``data.df`` (truncated to an
# int); it is reused below both for the threshold and for the final split.
split = int(data.df.shape[0] * 0.8)

# Compute a threshold to create the label:
# ``analysis_threshold`` is defined outside this excerpt; its result is only
# forwarded to ``clean_data`` further down.
threshold_ = analysis_threshold(data.df, split)

# Some plots of the variable Result:
plot_result(data.df)
plot_hist(data.df)

# Clean the data:
datas = data.clean_data(threshold=threshold_)
# Keep a copy that still contains 'Result' before it is dropped below.
old_df = datas.copy()
# Drop 'Result' along axis 1 (the column axis, assuming a pandas DataFrame).
datas = datas.drop(['Result'], axis=1)

# Split into the train/evaluation set and the test set:
# rows before ``split`` go to the former, rows from ``split`` on to the latter.
train_evaluation_set = datas.iloc[:split, :]
test_set = datas.iloc[split:, :]

# Get the block variables:
list_var = data.get_list_var_block()

#%% OCA method
oca_method = OCAMethod(train_evaluation_set,
                       n_min=10,
                       verbose=True,
                       reload_feature_importance=False,

예제 #3

파일 보기

@author: david.saltiel
"""

from data_loader import DataLoader
from OCA import OCAMethod
from RFE import RFEMethod
from BCA import BCAMethod
from graphics import create_graphic_for_method, create_figure2, create_figure3

''' This is the main function
    It calls all the 3 features selection
    method and compares them
'''
#%% reads the data
# Build the loader for the 'trade_selection_A229' csv dataset and clean it.
# The return value of clean_data() is not used here; every later step reads
# the data through ``data.df``.
data = DataLoader(dataset_name='trade_selection_A229', extension='csv')
data.clean_data()

#%% OCA method
oca_method = OCAMethod(
    data.df,
    n_min=10,
    verbose=True,
    reload_feature_importance=False,
)
oca_method.select_features()

#%% RFE method
rfe_method = RFEMethod(data.df, verbose=True)
rfe_method.select_features()
# Keep the value returned by save_all_score() under a module-level name.
rfe_dictionary = rfe_method.save_all_score()

#%% BCA method
bca_method = BCAMethod(data.df, verbose=True)
bca_method.select_features()