def buildDietTypeFreqTXTFile():
    """Aggregate overall diet item frequencies into per-type frequencies.

    Reads 'diet/dietOverallItemFreq/all_diet_frequency.txt', where each line
    is tokenized with wordpunct_tokenize and the first token is taken as the
    item and the second as its integer frequency. Every item is classified
    with dietType.dietType(); frequencies of items sharing a type are summed,
    and items classified as 'others' are left out.

    The totals are written to
    'diet/dietOverallTypeFreq/all_dietType_frequency.txt', one type per line,
    as a 25-character left-aligned type followed by a 10-character
    left-aligned count.

    Raises:
        IOError/OSError: if either file cannot be opened.
        IndexError: if a non-blank line has fewer than two tokens.
        ValueError: if the second token of a line is not an integer.
    """
    dietType_dict = {}
    # The output file is opened first (as before), so it is created/truncated
    # even when reading the input fails. Both handles are closed by the
    # context managers on every exit path, including exceptions.
    with open('diet/dietOverallTypeFreq/all_dietType_frequency.txt', 'w') as f_diet:
        with open('diet/dietOverallItemFreq/all_diet_frequency.txt', 'r') as f_items:
            for line in f_items:
                words = wordpunct_tokenize(line.strip('\n'))
                if not words:
                    # No tokens (e.g. a trailing blank line): nothing to
                    # count, and words[0] would raise IndexError.
                    continue
                # words[0]: item, words[1]: item frequency
                diettype = dietType.dietType(words[0])
                temp = int(words[1])
                if diettype != 'others':
                    dietType_dict[diettype] = dietType_dict.get(diettype, 0) + temp
        for key in dietType_dict:
            f_diet.write("%-25s%-10s\n" % (key, dietType_dict[key]))
def build_daily_single_diet_index(subjectID, n):
    """Return per-diet-type frequencies for one subject's n-th diet file.

    Reads 'diet/dietItemFreq/diet_frequency_<subjectID>_<n>.txt'. Each line is
    tokenized with wordpunct_tokenize; the first token is taken as the item
    and the second as its integer frequency. Items are classified with
    dietType.dietType() and the frequencies of items sharing a type are
    summed. Items classified as 'others' are left out.

    Args:
        subjectID: subject identifier as a string (it is concatenated into
            the file name).
        n: index of the file for this subject; converted with str().

    Returns:
        dict mapping diet type to its summed integer frequency.

    Raises:
        IOError/OSError: if the file cannot be opened.
        IndexError: if a non-blank line has fewer than two tokens.
        ValueError: if the second token of a line is not an integer.
    """
    singleDietType_dict = {}
    path = 'diet/dietItemFreq/diet_frequency_' + subjectID + '_' + str(n) + '.txt'
    # Use a context manager so the handle is closed even if a line is malformed.
    with open(path, 'r') as f_items:
        for line in f_items:
            words = wordpunct_tokenize(line.strip('\n'))
            if not words:
                # No tokens (e.g. a trailing blank line): nothing to count,
                # and words[0] would raise IndexError.
                continue
            # words[0]: item, words[1]: item frequency
            diettype = dietType.dietType(words[0])
            temp = int(words[1])
            if diettype != 'others':
                singleDietType_dict[diettype] = (
                    singleDietType_dict.get(diettype, 0) + temp)
    return singleDietType_dict
def build_daily_single_diet_index_with_time(subjectID, n):
    """Convert a two-level item-frequency index into a type-frequency index.

    The item-level index comes from
    buildItemIndex.build_daily_single_diet_index_with_time(subjectID, n) and
    is treated as {outer_key: {item: frequency}} (the outer keys are
    presumably time slots, judging by the function name -- confirm against
    buildItemIndex). Every item is classified with dietType.dietType() and
    frequencies of items of the same type are summed per outer key; items
    classified as 'others' are dropped.

    Returns:
        dict with the same outer keys, each mapping to a dict of
        {diet type: summed integer frequency}. An outer key whose items are
        all 'others' maps to an empty dict.
    """
    item_index = buildItemIndex.build_daily_single_diet_index_with_time(subjectID, n)
    type_index = {}
    for outer_key in item_index:
        per_item = item_index[outer_key]
        per_type = type_index[outer_key] = {}
        for item in per_item:
            category = dietType.dietType(item)
            # Convert before filtering so a non-integer frequency still
            # raises, even for an item that would be discarded.
            count = int(per_item[item])
            if category == 'others':
                continue
            per_type[category] = per_type.get(category, 0) + count
    return type_index
def buildSingleDietExcel(subjectID):
    """Build the diet spreadsheet for a single subject.

    Opens 'subject_template_<subjectID>.xlsx', takes the sheet at index 3 and
    scans it from row index 8 to the end. For every row whose first cell is
    non-empty, one output row is written with:

        column 0: subjectID
        column 1: the value of that first cell (the date)
        column 2: the diet items, each preceded by a single space
        column 3: the diet type of each item, each preceded by a single space

    The items for the k-th such row (counting from 1) are read from
    'diet/dietItemFreq/diet_frequency_<subjectID>_<k>.txt'; the first token
    of each line (per wordpunct_tokenize) is the item, and its type comes
    from dietType.dietType().

    The result is saved to 'diet/dietTable_<subjectID>.xls'.

    Args:
        subjectID: subject identifier as a string (it is concatenated into
            the file names).
    """
    file_location = 'subject_template_' + subjectID + '.xlsx'
    workbookR = xlrd.open_workbook(file_location)
    sheet = workbookR.sheet_by_index(3)

    workbookW = xlwt.Workbook()
    ws = workbookW.add_sheet('sheet1')

    rowW = 0   # next row to write in the output sheet
    index = 0  # 1-based counter of non-empty rows; selects the frequency file
    for rowR in range(8, sheet.nrows):
        date_value = sheet.cell_value(rowR, 0)
        if not date_value:
            continue

        ws.write(rowW, 0, subjectID)
        ws.write(rowW, 1, date_value)
        index += 1

        items = []
        item_types = []
        path = ('diet/dietItemFreq/diet_frequency_' + subjectID + '_'
                + str(index) + '.txt')
        # Context manager closes the handle even if a line is malformed.
        with open(path, 'r') as f_items:
            for line in f_items:
                words = wordpunct_tokenize(line.strip('\n'))
                if not words:
                    # No tokens (e.g. a trailing blank line): nothing to
                    # record, and words[0] would raise IndexError.
                    continue
                items.append(words[0])
                item_types.append(dietType.dietType(words[0]))

        # Every entry is prefixed with one space, so a non-empty cell starts
        # with a space -- same cell contents as the previous implementation.
        ws.write(rowW, 2, ''.join(' ' + item for item in items))
        ws.write(rowW, 3, ''.join(' ' + item_type for item_type in item_types))
        rowW += 1

    workbookW.save('diet/dietTable_' + subjectID + '.xls')