def printstats(varr):
    """Collect labelled summary statistics for ``varr``.

    Despite the name, nothing is printed; the caller receives the data.

    ``mean``, ``median`` and ``ca`` are not defined in this block; they are
    resolved from the surrounding module.

    Args:
        varr: A sized collection of values (``len``, ``min`` and ``max``
            are applied to it directly).

    Returns:
        A list of ``(label, value)`` tuples in the order length, mean,
        median, minimum, maximum, standard deviation. The standard
        deviation is the square root of ``ca.var(varr)``; when ``varr``
        holds one element or fewer, the string ``"CANT COMPUTE len = 1"``
        is stored in its place.
    """
    count = len(varr)
    summary = [
        ("len: ", count),
        ("mean: ", mean(varr)),
        ("median: ", median(varr)),
        ("min ", min(varr)),
        ("max ", max(varr)),
    ]

    # The variance is only requested when there is more than one sample.
    if count > 1:
        spread = pow(ca.var(varr), 0.5)
    else:
        spread = "CANT COMPUTE len = 1"
    summary.append(("stdev:", spread))
    return summary
def _gfanalyze(notes,feature_list,fset_names=None): if fset_names is None: fsetnames = [ ('feature_%d' % i) for i in xrange(len(feature_list))] features = [] for feat in feature_list: features.append([feat(n).values()[0] for n in notes]) print "means: ",[mean(x) for x in features] print "vars: ",[ca.var(x) if len(x) > 1 else "ZEROLENGTH" for x in features ] print "max: ",[max(x) for x in features] print "min: ",[min(x) for x in features] # try: # for result in features: # print "-------------",fset_names[features.index(result)], "-------------------" # print r.stem(c([log(x+1)/log(2) for x in result])) # except: # print sys.exc_info(); return features