Esempio n. 1
0
def get_subjects_sessions_dictionary(input_subjects,
                                     cache,
                                     resultdir,
                                     prefix,
                                     dbfile,
                                     useSentinal,
                                     shuffle=False):
    """Select the subjects to run and look up the sessions of each one.

    Args:
        input_subjects: collection of subject identifiers. If it contains
            the literal "all", every subject returned by the database's
            ``getAllSubjects()`` is used instead.
        cache: forwarded unchanged to ``OpenSubjectDatabase``.
        resultdir: forwarded to ``get_processed_subjects`` when
            ``useSentinal`` is true.
        prefix: forwarded unchanged to ``OpenSubjectDatabase``.
        dbfile: forwarded unchanged to ``OpenSubjectDatabase``.
        useSentinal: when true, subjects reported by
            ``get_processed_subjects`` are removed from the selection and
            repeated entries are dropped.
        shuffle: when true, the selection is returned in random order.

    Returns:
        A ``(subjects, subject_sessions_dictionary)`` tuple: the selected
        subjects and a dict mapping each of them to the value returned by
        ``getSessionsFromSubject`` for that subject.

    The caller's ``input_subjects`` is never reordered by this function.
    """
    import random
    _temp = OpenSubjectDatabase(cache, ['all'], prefix, dbfile)
    # NOTE(review): if input_subjects is a plain string this is a substring
    # test, not a membership test -- confirm callers always pass a list.
    if "all" in input_subjects:
        input_subjects = _temp.getAllSubjects()
    if useSentinal:
        print("=" * 80)
        print("Using Sentinal Files to Limit Jobs Run")
        _excluded = set(get_processed_subjects(resultdir, input_subjects))
        # Filter in input order rather than via a set difference: same
        # members, but the resulting order is reproducible between runs.
        subjects = []
        for subject in input_subjects:
            if subject not in _excluded:
                _excluded.add(subject)  # a repeated entry is kept only once
                subjects.append(subject)
    else:
        subjects = input_subjects

    if shuffle:
        # random.shuffle works in place; shuffle a copy so neither the
        # caller's list nor the list handed out by the database is changed.
        subjects = list(subjects)
        random.shuffle(
            subjects)  # randomly shuffle to get max cluster efficiency
    subject_sessions_dictionary = dict()
    for subject in subjects:
        subject_sessions_dictionary[subject] = _temp.getSessionsFromSubject(
            subject)
    return subjects, subject_sessions_dictionary
Esempio n. 2
0
def get_subjects(subjects, cache, prefix, dbfile, shuffle=True):
    """Return the subjects to process, optionally in random order.

    Args:
        subjects: collection of subject identifiers. If it contains the
            literal "all", every subject returned by the database's
            ``getAllSubjects()`` is used instead.
        cache: forwarded unchanged to ``OpenSubjectDatabase``.
        prefix: forwarded unchanged to ``OpenSubjectDatabase``.
        dbfile: forwarded unchanged to ``OpenSubjectDatabase``.
        shuffle: when true (the default), a randomly ordered copy is
            returned; when false, the selection is returned as-is.

    Returns:
        The selected subjects. The caller's ``subjects`` argument is never
        reordered.
    """
    import random
    _temp = OpenSubjectDatabase(cache, ['all'], prefix, dbfile)
    if "all" in subjects:
        subjects = _temp.getAllSubjects()
    if shuffle:
        # random.shuffle works in place; copy first so the argument (or the
        # list handed out by the database) is left untouched.
        subjects = list(subjects)
        random.shuffle(subjects)  # randomly shuffle to get max
    return subjects
Esempio n. 3
0
def get_subjects(argv, cache, prefix, dbfile, shuffle=True):
    """Return the subjects named in ``argv``, optionally in random order.

    Args:
        argv: mapping that holds the requested subjects under the
            ``"--subject"`` key. The value is used as-is (it is not split
            on commas). If it contains the literal "all", every subject
            returned by the database's ``getAllSubjects()`` is used.
        cache: forwarded unchanged to ``OpenSubjectDatabase``.
        prefix: forwarded unchanged to ``OpenSubjectDatabase``.
        dbfile: forwarded unchanged to ``OpenSubjectDatabase``.
        shuffle: when true (the default), a randomly ordered copy is
            returned; when false, the selection is returned as-is.

    Returns:
        The selected subjects. The value stored in ``argv`` is never
        reordered.
    """
    import random
    _temp = OpenSubjectDatabase(cache, ['all'], prefix, dbfile)
    subjects = argv["--subject"]
    if "all" in subjects:
        subjects = _temp.getAllSubjects()
    if shuffle:
        # random.shuffle works in place; copy first so the list stored in
        # argv (or handed out by the database) is left untouched.
        subjects = list(subjects)
        random.shuffle(subjects)  # randomly shuffle to get max
    return subjects
Esempio n. 4
0
def get_subjects_sessions_dictionary(input_subjects, cache, resultdir, prefix, dbfile, useSentinal, shuffle=False):
    """Pick the subjects to run and map each one to its sessions.

    Args:
        input_subjects: collection of subject identifiers. If it contains
            the literal "all", every subject returned by the database's
            ``getAllSubjects()`` is used instead.
        cache: forwarded unchanged to ``OpenSubjectDatabase``.
        resultdir: forwarded to ``get_processed_subjects`` when
            ``useSentinal`` is true.
        prefix: forwarded unchanged to ``OpenSubjectDatabase``.
        dbfile: forwarded unchanged to ``OpenSubjectDatabase``.
        useSentinal: when true, subjects reported by
            ``get_processed_subjects`` are removed from the selection and
            repeated entries are dropped.
        shuffle: when true, the selection is returned in random order.

    Returns:
        A ``(subjects, subject_sessions_dictionary)`` tuple: the selected
        subjects and a dict mapping each of them to the value returned by
        ``getSessionsFromSubject`` for that subject.

    The caller's ``input_subjects`` is never reordered by this function.
    """
    import random
    _temp = OpenSubjectDatabase(cache, ['all'], prefix, dbfile)
    if "all" in input_subjects:
        input_subjects = _temp.getAllSubjects()
    if useSentinal:
        print("="*80)
        print("Using Sentinal Files to Limit Jobs Run")
        _already_handled = set(get_processed_subjects(resultdir, input_subjects))
        # Walk the input in order instead of subtracting sets, so the
        # surviving subjects come out in a reproducible order.
        subjects = []
        for candidate in input_subjects:
            if candidate in _already_handled:
                continue
            _already_handled.add(candidate)  # keep a repeated entry only once
            subjects.append(candidate)
    else:
        subjects = input_subjects

    if shuffle:
        # Shuffle a private copy: random.shuffle reorders its argument in
        # place, which would otherwise alter the caller's list.
        subjects = list(subjects)
        random.shuffle(subjects)  # randomly shuffle to get max cluster efficiency
    subject_sessions_dictionary = dict()
    for subject in subjects:
        subject_sessions_dictionary[subject] = _temp.getSessionsFromSubject(subject)
    return subjects, subject_sessions_dictionary