Пример #1
0
# def test_geweke_lda():
if __name__ == "__main__":
    N_iter = 5000
    T = 3           # Number of topics
    D = 10         # Number of documents
    V = 20          # Number of words
    N = 20         # Number of words per document
    alpha_beta = 1.0

    # Generate synthetic data
    data = np.random.poisson(2, (D,V))
    data = csr_matrix(data)

    # Sample a GP
    model = StickbreakingCorrelatedLDA(data, T, alpha_beta=alpha_beta)

    # Run a Geweke test
    thetas = []
    betas = []
    for itr in progprint_xrange(N_iter):
        # Resample the data
        model.generate(N, keep=True)

        # Resample the parameters
        model.resample()

        # Update our samples
        thetas.append(model.theta.copy())
        betas.append(model.beta.copy())
Пример #2
0
    data = np.zeros((D, model.V),dtype=int)
    for d in xrange(D):
        doc = model.generate(N=N, keep=True)
        data[d,:] = doc.w

# def test_geweke_lda():
if __name__ == "__main__":
    N_iter = 50000
    T = 3           # Number of topics
    D = 10         # Number of documents
    V = 10          # Number of words
    N = 20         # Number of words per document
    alpha_beta = 1.0

    # Sample a GP
    model = StickbreakingCorrelatedLDA(T, V, alpha_beta=alpha_beta)

    # Run a Geweke test
    thetas = []
    betas = []
    for itr in progprint_xrange(N_iter):
        # Resample the data
        resample_data(model, D, N)

        # Resample the parameters
        model.resample_model()

        # Update our samples
        thetas.append(model.thetas.copy())
        betas.append(model.beta.copy())