#setting a string with step parameters step_params = ' ' + measure_fname + ' ' + mdir absolute_str = '' if absval: absolute_str = ' ' + au.abs_str() step_params += absolute_str leave_str = '' if leave > -1: leave_str = ' excluding subject ' + str(leave) step_params += leave_str #checking if this measure has already been done endstep = au.measure_str() + step_params stepdone = au.is_done(chkf, endstep) #add pluses to output dir if it already exists if stepdone: while os.path.exists(mdir): mdir += '+' else: #work in the last folder used plus = False while os.path.exists(mdir): mdir += '+' plus = True if plus: mdir = mdir[0:-1] #setting statsdir
def group_distance(measure_function, datadir, groups, groupsizes, chkf,
                   absolute=False, outdir='', foldno='', expname='',
                   exclude_idx=-1, exclude_subj='', exclude_subjclass=''):
    """Run ``measure_function`` on every unordered pair of groups.

    For each pair (g1, g2) with g1 < g2 the mean/variance/std file names of
    both groups are built from ``datadir`` and handed to ``measure_function``
    unless the checklist ``chkf`` already records that step as done.

    Parameters:
        measure_function: callable invoked as
            ``measure_function(mean1, mean2, var1, var2, std1, std2,
            size1, size2, experiment, outdir, exclude_idx)``. Its
            ``__name__`` is part of the checklist step string and its return
            value is treated as the output file name.
        datadir: directory prefix of the per-group statistics files, named
            ``<group>_<au.mean_str()>``, ``<group>_<au.var_str()>`` and
            ``<group>_<au.std_str()>``.
        groups: sequence of group name strings.
        groupsizes: per-group indexable records; element ``[1]`` is read as
            the sample size. It is decremented IN PLACE for the group a
            subject is removed from.
        chkf: checklist handle passed through to ``au.is_done`` and
            ``au.checklist_add``.
        absolute: when true, ``change_to_absolute_values`` is applied to each
            output file produced.
        outdir: output directory given to ``measure_function``; falls back to
            ``datadir`` when empty.
        foldno, expname: accepted for interface compatibility; not used.
        exclude_idx: index of a subject to leave out; values <= -1 disable
            the exclusion logic.
        exclude_subj: passed to ``remove_subject_from_stats`` as the subject
            volume to remove.
        exclude_subjclass: group name used to decide which group's
            statistics get the subject removed.

    Returns:
        The value returned by ``measure_function`` for the last pair that was
        actually computed, or ``None`` when no pair was computed (fewer than
        two groups, or every step already recorded as done).
    """
    if not outdir:
        outdir = datadir

    ngroups = len(groups)

    # One [mean, var, std] path stem per group, kept as ordinary strings so
    # long paths are never truncated and str concatenation always works.
    # Built once: after a subject is excluded the suffixed stems must stay in
    # step with the decremented sample size for every later pair.
    gfnames = [[datadir + os.path.sep + gname + '_' + stat_str()
                for stat_str in (au.mean_str, au.var_str, au.std_str)]
               for gname in groups]

    # Stays None when nothing had to be computed, so the final return is
    # always well defined.
    outfname = None
    subject_excluded = False

    for g1 in range(ngroups):
        g1name = groups[g1]

        for g2 in range(g1 + 1, ngroups):
            g2name = groups[g2]
            experiment = g1name + '_vs_' + g2name

            # Index of the group whose statistics lose the excluded subject.
            # NOTE(review): the group picked here is the one OPPOSITE to the
            # group whose name matches exclude_subjclass. That mapping is
            # kept exactly as found; confirm against the caller whether the
            # subject should instead be removed from the matching group.
            eg = -1
            if exclude_idx > -1:
                if exclude_subjclass == g1name:
                    eg = g2
                elif exclude_subjclass == g2name:
                    eg = g1

            # __name__ is available on Python 2 and 3 (func_name is 2-only).
            step = (au.measure_str() + ' ' + measure_function.__name__ +
                    ' ' + experiment + ' ' + datadir)

            # Remove the subject from the stats of group eg (at most once).
            if eg > -1:
                exclude_str = '_' + au.excluded_str() + str(exclude_idx)
                step += exclude_str
                experiment += exclude_str

                if not au.is_done(chkf, step) and not subject_excluded:
                    excluded_stems = [stem + exclude_str
                                      for stem in gfnames[eg]]

                    rstep = (au.remove_str() + ' ' + au.subject_str() +
                             ' ' + str(exclude_subj) + ' ' +
                             au.fromstats_str() + ' ' + datadir)
                    if not au.is_done(chkf, rstep):
                        # (meanfname, varfname, samplesize, subjvolfname,
                        #  newmeanfname, newvarfname, newstdfname)
                        remove_subject_from_stats(gfnames[eg][0],
                                                  gfnames[eg][1],
                                                  groupsizes[eg][1],
                                                  exclude_subj,
                                                  excluded_stems[0],
                                                  excluded_stems[1],
                                                  excluded_stems[2])
                        au.checklist_add(chkf, rstep)

                    # From now on this group is read from the suffixed files
                    # and counts one subject less.
                    gfnames[eg] = excluded_stems
                    groupsizes[eg][1] -= 1
                    subject_excluded = True

            # Calculating distance.
            if not au.is_done(chkf, step):
                ext = au.ext_str()
                mean1fname = au.add_extension_if_needed(gfnames[g1][0], ext)
                mean2fname = au.add_extension_if_needed(gfnames[g2][0], ext)
                var1fname = au.add_extension_if_needed(gfnames[g1][1], ext)
                var2fname = au.add_extension_if_needed(gfnames[g2][1], ext)
                std1fname = au.add_extension_if_needed(gfnames[g1][2], ext)
                std2fname = au.add_extension_if_needed(gfnames[g2][2], ext)

                outfname = measure_function(mean1fname, mean2fname,
                                            var1fname, var2fname,
                                            std1fname, std2fname,
                                            groupsizes[g1][1],
                                            groupsizes[g2][1],
                                            experiment, outdir, exclude_idx)

                if absolute:
                    change_to_absolute_values(outfname)

                au.checklist_add(chkf, step)

    return outfname
#setting a string with step parameters step_params = ' ' + measure_fname + ' ' + mdir absolute_str = '' if absval: absolute_str = ' ' + au.abs_str() step_params += absolute_str leave_str = '' if leave > -1: leave_str = ' excluding subject ' + str(leave) step_params += leave_str #checking if this measure has already been done endstep = au.measure_str() + step_params stepdone = au.is_done(chkf, endstep) #add pluses to output dir if it already exists if stepdone: while os.path.exists (mdir): mdir += '+' else: #work in the last folder used plus = False while os.path.exists (mdir): mdir += '+' plus = True if plus: mdir = mdir[0:-1] #setting statsdir
def group_distance(measure_function, datadir, groups, groupsizes, chkf,
                   absolute=False, outdir='', foldno='', expname='',
                   exclude_idx=-1, exclude_subj='', exclude_subjclass=''):
    """Run ``measure_function`` on every unordered pair of groups.

    For each pair (g1, g2) with g1 < g2 the mean/variance/std file names of
    both groups are built from ``datadir`` and handed to ``measure_function``
    unless the checklist ``chkf`` already records that step as done.

    Parameters:
        measure_function: callable invoked as
            ``measure_function(mean1, mean2, var1, var2, std1, std2,
            size1, size2, experiment, outdir, exclude_idx)``. Its
            ``__name__`` is part of the checklist step string and its return
            value is treated as the output file name.
        datadir: directory prefix of the per-group statistics files, named
            ``<group>_<au.mean_str()>``, ``<group>_<au.var_str()>`` and
            ``<group>_<au.std_str()>``.
        groups: sequence of group name strings.
        groupsizes: per-group indexable records; element ``[1]`` is read as
            the sample size. It is decremented IN PLACE for the group a
            subject is removed from.
        chkf: checklist handle passed through to ``au.is_done`` and
            ``au.checklist_add``.
        absolute: when true, ``change_to_absolute_values`` is applied to each
            output file produced.
        outdir: output directory given to ``measure_function``; falls back to
            ``datadir`` when empty.
        foldno, expname: accepted for interface compatibility; not used.
        exclude_idx: index of a subject to leave out; values <= -1 disable
            the exclusion logic.
        exclude_subj: passed to ``remove_subject_from_stats`` as the subject
            volume to remove.
        exclude_subjclass: group name used to decide which group's
            statistics get the subject removed.

    Returns:
        The value returned by ``measure_function`` for the last pair that was
        actually computed, or ``None`` when no pair was computed (fewer than
        two groups, or every step already recorded as done).
    """
    if not outdir:
        outdir = datadir

    ngroups = len(groups)

    # One [mean, var, std] path stem per group, kept as ordinary strings so
    # long paths are never truncated and str concatenation always works.
    # Built once: after a subject is excluded the suffixed stems must stay in
    # step with the decremented sample size for every later pair.
    gfnames = [[datadir + os.path.sep + gname + '_' + stat_str()
                for stat_str in (au.mean_str, au.var_str, au.std_str)]
               for gname in groups]

    # Stays None when nothing had to be computed, so the final return is
    # always well defined.
    outfname = None
    subject_excluded = False

    for g1 in range(ngroups):
        g1name = groups[g1]

        for g2 in range(g1 + 1, ngroups):
            g2name = groups[g2]
            experiment = g1name + '_vs_' + g2name

            # Index of the group whose statistics lose the excluded subject.
            # NOTE(review): the group picked here is the one OPPOSITE to the
            # group whose name matches exclude_subjclass. That mapping is
            # kept exactly as found; confirm against the caller whether the
            # subject should instead be removed from the matching group.
            eg = -1
            if exclude_idx > -1:
                if exclude_subjclass == g1name:
                    eg = g2
                elif exclude_subjclass == g2name:
                    eg = g1

            # __name__ is available on Python 2 and 3 (func_name is 2-only).
            step = (au.measure_str() + ' ' + measure_function.__name__ +
                    ' ' + experiment + ' ' + datadir)

            # Remove the subject from the stats of group eg (at most once).
            if eg > -1:
                exclude_str = '_' + au.excluded_str() + str(exclude_idx)
                step += exclude_str
                experiment += exclude_str

                if not au.is_done(chkf, step) and not subject_excluded:
                    excluded_stems = [stem + exclude_str
                                      for stem in gfnames[eg]]

                    rstep = (au.remove_str() + ' ' + au.subject_str() +
                             ' ' + str(exclude_subj) + ' ' +
                             au.fromstats_str() + ' ' + datadir)
                    if not au.is_done(chkf, rstep):
                        # (meanfname, varfname, samplesize, subjvolfname,
                        #  newmeanfname, newvarfname, newstdfname)
                        remove_subject_from_stats(gfnames[eg][0],
                                                  gfnames[eg][1],
                                                  groupsizes[eg][1],
                                                  exclude_subj,
                                                  excluded_stems[0],
                                                  excluded_stems[1],
                                                  excluded_stems[2])
                        au.checklist_add(chkf, rstep)

                    # From now on this group is read from the suffixed files
                    # and counts one subject less.
                    gfnames[eg] = excluded_stems
                    groupsizes[eg][1] -= 1
                    subject_excluded = True

            # Calculating distance.
            if not au.is_done(chkf, step):
                ext = au.ext_str()
                mean1fname = au.add_extension_if_needed(gfnames[g1][0], ext)
                mean2fname = au.add_extension_if_needed(gfnames[g2][0], ext)
                var1fname = au.add_extension_if_needed(gfnames[g1][1], ext)
                var2fname = au.add_extension_if_needed(gfnames[g2][1], ext)
                std1fname = au.add_extension_if_needed(gfnames[g1][2], ext)
                std2fname = au.add_extension_if_needed(gfnames[g2][2], ext)

                outfname = measure_function(mean1fname, mean2fname,
                                            var1fname, var2fname,
                                            std1fname, std2fname,
                                            groupsizes[g1][1],
                                            groupsizes[g2][1],
                                            experiment, outdir, exclude_idx)

                if absolute:
                    change_to_absolute_values(outfname)

                au.checklist_add(chkf, step)

    return outfname