amount = config.amount path = data.getDataDir(config.amount, config.cut, config.big) # gets all files fileList = os.listdir(path) fileExt = ".png" imgs = filter(lambda File: File[-4:] == fileExt, fileList) imgs.sort() print "Found %d %s images" % (len(imgs), fileExt) ranks, names, histograms = data.getBinnedHistograms(amount, cut=True, big=False) X = np.array([image.imgToArray(path+imgs[i]) for i in xrange(len(imgs))]) print X.shape, histograms.shape website_names = imgs BIN_HISTOGRAMS = {} IMG_ARRAYS = {} assert(len(names) == len(website_names)) for i in xrange(len(names)): assert(website_names[i] == names[i]) IMG_ARRAYS[names[i]] = X[i] BIN_HISTOGRAMS[names[i]] = histograms[i] names = np.array(names) def test(data, names, recommender, fractionTrain=.8, highFactor=.1, verbose=False): """ Parameters: