# Code example #1
0
import csv
import random
import DatabaseManager

# Script setup: pick the feature columns to keep, open the input/output CSV
# files, write the reduced header row and create the accumulators used by the
# row-processing loop.

# Hard-coded list of feature columns, kept for reference only; the indexes
# actually used come from DatabaseManager.
# sub_set_features = [6,7,8,9,12,13,14,15,16,17,21,22,24,33,41,49]
sub_set_indexes = DatabaseManager.get_sub_feature_indexes()

# The file handles are bound to names so they can be closed explicitly.
# NOTE(review): the code after the row loop should call source_file.close()
# and subset_file.close(); until it does, closing is left to the interpreter.
# Binary modes ("rb"/"wb") are what the Python 2 csv module expects.
source_file = open("original_data.csv", "rb")
data_reader = csv.reader(source_file)
subset_file = open("subset_features_data.csv", "wb")
data_writer = csv.writer(subset_file)

# Consume the header row and keep only the selected columns.
# The next() builtin (Python 2.6+) replaces the Python-2-only .next() method.
header = next(data_reader)
header = [header[j] for j in sub_set_indexes]
data_writer.writerow(header)

# Maps patient_nbr (column 1 of a row) to the number of encounters seen so
# far for that patient.
patientEncounters = {}
# Accumulators filled outside this block; presumably rows grouped by
# readmission outcome -- TODO confirm against the rest of the script.
readmitted = []
no_readmitted = []

for (index, row) in enumerate(data_reader):
	addRow = True

	if(row[1] in patientEncounters):
	#feature index 1 is patient_nbr
	#a encounter for this patient was already added
		addRow = False
		patientEncounters[row[1]] += 1
	else:
		patientEncounters[row[1]] = 1

	if(addRow and int(row[7]) in [13,14,19,20,21]):
	#feature index 7 is discharge_disposition