Пример #1
0
                [['PatientID', 'SliceID', 'SOPInstanceUID']+poscols].reset_index(drop=True)
# Order the test metadata by SliceID and then by the position columns, keep
# only the identifier and position columns, and renumber the rows from zero.
tstmdf = tstmdf.sort_values(['SliceID'] + poscols)
tstmdf = tstmdf[['PatientID', 'SliceID', 'SOPInstanceUID'] + poscols]
tstmdf = tstmdf.reset_index(drop=True)

# 1-based running counter of each row within its SliceID group, following the
# current row order of the frame.
trnmdf['seq'] = trnmdf.groupby(['SliceID']).cumcount() + 1
tstmdf['seq'] = tstmdf.groupby(['SliceID']).cumcount() + 1

# Reduce both frames to the identifier columns plus the counter, and expose
# SOPInstanceUID under the column name 'Image'.
keepcols = ['PatientID', 'SliceID', 'SOPInstanceUID', 'seq']
trnmdf = trnmdf[keepcols]
trnmdf.columns = ['PatientID', 'SliceID', 'Image', 'seq']
tstmdf = tstmdf[keepcols]
tstmdf.columns = ['PatientID', 'SliceID', 'Image', 'seq']


# Load Data Frames
# Each split's frame is read from the `.dataset.data` attribute of the object
# that loadobj returns for the current SIZE, fold and GLOBALEPOCH.
trn_loader_path = os.path.join(
    path_emb, 'loader_trn_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH))
trndf = loadobj(trn_loader_path).dataset.data

val_loader_path = os.path.join(
    path_emb, 'loader_val_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH))
valdf = loadobj(val_loader_path).dataset.data

tst_loader_path = os.path.join(
    path_emb, 'loader_tst_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH))
tstdf = loadobj(tst_loader_path).dataset.data

# Record every row's position (0..n-1) in its freshly loaded frame.
# NOTE(review): presumably used later to index the matching embedding
# array -- confirm against the code that consumes 'embidx'.
for split_frame in (trndf, valdf, tstdf):
    split_frame['embidx'] = range(len(split_frame))

# Join the metadata columns onto every split using the 'Image' key.  merge()
# defaults to an inner join, so rows whose Image has no metadata match are
# dropped from the result.
#
# PatientID is removed from the train metadata before merging (presumably the
# loaded train/validation frames already carry it -- confirm).  The axis is
# passed by keyword: the positional form `drop(label, 1)` was deprecated in
# pandas 1.3 and raises a TypeError from pandas 2.0.  The result is computed
# once because the train and validation splits share the same metadata.
trnmeta = trnmdf.drop('PatientID', axis=1)
trndf = trndf.merge(trnmeta, on='Image')
valdf = valdf.merge(trnmeta, on='Image')
# The test metadata is merged with its PatientID column left in place.
tstdf = tstdf.merge(tstmdf, on='Image')

# Report the (rows, columns) shape of each split's frame, in trn/val/tst order.
for shape_template, split_frame in (
        ('Trn df shape {} {}', trndf),
        ('Val df shape {} {}', valdf),
        ('Tst df shape {} {}', tstdf)):
    nrows, ncols = split_frame.shape
    logger.info(shape_template.format(nrows, ncols))
Пример #2
0
# Reduce each metadata frame to the patient id, the instance UID and the
# sequence counter, then expose SOPInstanceUID under the column name 'Image'.
keepcols = ['PatientID', 'SOPInstanceUID', 'seq']

trnmdf = trnmdf[keepcols]
trnmdf.columns = ['PatientID', 'Image', 'seq']

trn2mdf = trn2mdf[keepcols]
trn2mdf.columns = ['PatientID', 'Image', 'seq']

tstmdf = tstmdf[keepcols]
tstmdf.columns = ['PatientID', 'Image', 'seq']

tst2mdf = tst2mdf[keepcols]
tst2mdf.columns = ['PatientID', 'Image', 'seq']

# Load Data Frames
# Each split's frame is read from the `.dataset.data` attribute of the object
# that loadobj returns for the current SIZE, fold and GLOBALEPOCH.

# logger.info(os.listdir('/data/sdsml_prod/projects/data/ldc/rsna'))
trn_loader_name = 'loader_trn_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH)
trndf = loadobj(os.path.join(path_emb, trn_loader_name)).dataset.data

val_loader_name = 'loader_val_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH)
valdf = loadobj(os.path.join(path_emb, val_loader_name)).dataset.data

tst_loader_name = 'loader_tst_size{}_fold{}_ep{}'.format(SIZE, fold, GLOBALEPOCH)
tstdf = loadobj(os.path.join(path_emb, tst_loader_name)).dataset.data
tst2df = loadobj(
    os.path.join(
        path_emb,