[['PatientID', 'SliceID', 'SOPInstanceUID']+poscols].reset_index(drop=True)
# NOTE(review): the line above is the tail of a statement that starts before
# this section; it is kept verbatim.

# Order the test metadata by SliceID and then by the position columns, and
# keep only the identifier and position columns.
tstmdf = (
    tstmdf.sort_values(['SliceID'] + poscols)
    [['PatientID', 'SliceID', 'SOPInstanceUID'] + poscols]
    .reset_index(drop=True)
)

# 1-based running counter of rows within each SliceID, in current row order.
trnmdf['seq'] = trnmdf.groupby(['SliceID']).cumcount() + 1
tstmdf['seq'] = tstmdf.groupby(['SliceID']).cumcount() + 1

keepcols = ['PatientID', 'SliceID', 'SOPInstanceUID', 'seq']
trnmdf = trnmdf[keepcols]
tstmdf = tstmdf[keepcols]
# SOPInstanceUID is relabelled 'Image', the key used for the merges below.
trnmdf.columns = tstmdf.columns = ['PatientID', 'SliceID', 'Image', 'seq']

# Load Data Frames
trndf = loadobj(
    os.path.join(
        path_emb,
        'loader_trn_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH),
    )
).dataset.data
valdf = loadobj(
    os.path.join(
        path_emb,
        'loader_val_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH),
    )
).dataset.data
tstdf = loadobj(
    os.path.join(
        path_emb,
        'loader_tst_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH),
    )
).dataset.data

# Record each row's position before merging, since a merge can drop or
# reorder rows.
# NOTE(review): presumably used later to index the saved embeddings - confirm.
trndf['embidx'] = range(trndf.shape[0])
valdf['embidx'] = range(valdf.shape[0])
tstdf['embidx'] = range(tstdf.shape[0])

# Attach SliceID/seq to every image row. The validation frame is merged
# against the *train* metadata, as in the original code.
# `columns=` replaces the positional axis argument (`drop('PatientID', 1)`),
# which pandas 2.0 no longer accepts.
trndf = trndf.merge(trnmdf.drop(columns='PatientID'), on='Image')
valdf = valdf.merge(trnmdf.drop(columns='PatientID'), on='Image')
tstdf = tstdf.merge(tstmdf, on='Image')

logger.info('Trn df shape {} {}'.format(*trndf.shape))
logger.info('Val df shape {} {}'.format(*valdf.shape))
logger.info('Tst df shape {} {}'.format(*tstdf.shape))
keepcols = ['PatientID', 'SOPInstanceUID', 'seq'] trnmdf = trnmdf[keepcols] trn2mdf = trn2mdf[keepcols] tstmdf = tstmdf[keepcols] tst2mdf = tst2mdf[keepcols] trnmdf.columns = trn2mdf.columns = tstmdf.columns = tst2mdf.columns = [ 'PatientID', 'Image', 'seq' ] # Load Data Frames # logger.info(os.listdir('/data/sdsml_prod/projects/data/ldc/rsna')) trndf = loadobj( os.path.join( path_emb, 'loader_trn_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH))).dataset.data valdf = loadobj( os.path.join( path_emb, 'loader_val_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH))).dataset.data tstdf = loadobj( os.path.join( path_emb, 'loader_tst_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH))).dataset.data tst2df = loadobj( os.path.join( path_emb,