def getFreqRepr(X, D):
    """Build word-keyed frequency and feature tables from X.

    X must expose ``words`` (an iterable of keys), ``freq`` (indexable by a
    word's position) and ``features`` (indexable as ``features[i, j]``).
    D is the number of feature columns copied for each word.

    Returns a pair ``(freqX, reprX)`` of OrderedDicts filled in the iteration
    order of ``X.words``:
      * ``freqX[w]`` is ``X.freq[i]``
      * ``reprX[w]`` is a dict mapping each column ``j`` in ``0 .. D-1`` to
        ``X.features[i, j]``
    where ``i`` is the position of ``w`` in ``X.words``.  A repeated word
    overwrites the values stored for its earlier occurrence.
    """
    freqX = OrderedDict()
    reprX = OrderedDict()
    # Loop-invariant, so build it once; ``range`` (unlike ``xrange``) exists
    # on both Python 2 and Python 3.
    columns = range(D)
    for i, w in enumerate(X.words):
        freqX[w] = X.freq[i]
        reprX[w] = {j: X.features[i, j] for j in columns}
    return freqX, reprX


# read input parameters
if __name__ == '__main__':
    # Fail with a usage line instead of a bare IndexError when arguments
    # are missing; extra arguments are still ignored, as before.
    if len(sys.argv) < 4:
        sys.exit('usage: %s N D Nseed' % sys.argv[0])
    N = int(sys.argv[1])
    D = int(sys.argv[2])
    Nseed = int(sys.argv[3])

    # make X,Y mock data
    (X, Y, pi) = make(N, Nseed, D)
    # seed pairs each of the first Nseed indices with itself
    seed = [(i, i) for i in range(Nseed)]

    # write the mock data and the seed pairs to disk
    freqX, reprX = getFreqRepr(X, D)
    freqY, reprY = getFreqRepr(Y, D)
    IO.writePickledWords('pockX.txt', freqX, reprX)
    IO.writePickledWords('pockY.txt', freqY, reprY)
    IO.writeWords('mockX.txt', X)
    IO.writeWords('mockY.txt', Y)
    IO.writeSeed('seedXY.txt', seed)

    # Parenthesised single argument: prints the same text whether ``print``
    # is the Python 2 statement or the Python 3 function.
    print(X.asTuple())
    # now need to save