Python MultiArmedBandit.get_hidden_states примеры использования

Язык программирования: Python

Пространство имен/Пакет: environments

Класс/Тип: MultiArmedBandit

Метод/Функция: get_hidden_states

Примеров на hotexamples.com: 2

Python MultiArmedBandit.get_hidden_states — найдено 2 примера. Это лучшие примеры кода на Python для environments.MultiArmedBandit.get_hidden_states, полученные из проектов с открытым исходным кодом. Вы можете оценить каждый пример, чтобы помочь нам улучшить качество примеров.

Основные методы

Показать Скрыть

MultiArmedBandit(3)

expected_performance(1)

get_hidden_states(1)

Пример #1

Показать файл

Файл: pmodels.py Проект: satpreetsingh/pyBefit

def main():
    """Fit a RescorlaWagner model to simulated bandit data and plot the fit.

    Two fits are run with the ``isres`` optimiser, each searching a single
    parameter bounded to [0, 1] and started from 0.5:

    1. the free energy of one model built on a single ``MultiArmedBandit``;
    2. the free energy summed over ``n`` separately constructed
       ``MultiArmedBandit`` blocks.

    After each fit the optimum is printed, and the observations, hidden
    states and model beliefs of the first environment are drawn on a shared
    axis.

    NOTE(review): ``np`` and ``RescorlaWagner`` are not bound inside this
    function; presumably they are defined at module level -- confirm.
    """
    from environments import MultiArmedBandit
    from optmethods import isres
    import seaborn as sns
    sns.set(style="white", palette="muted", color_codes=True)

    T = 100
    env = MultiArmedBandit(T)
    pm = RescorlaWagner(env, env.d_x)

    obs = env.get_observations()
    hst = env.get_hidden_states()

    def plot_fit(post):
        # Overlay observations, hidden states and beliefs on one axis.
        ax = obs.plot(y=r'$o_t$', style='go')
        ax = hst.plot(y=r'$p_t$', style='k--', ax=ax)
        ax = post.plot(y=r'$\mu_t$', style='r-', ax=ax)
        ax.legend(numpoints=1)

    # use isres for optimisation of one dimensional functions
    bounds = {'ub': np.array([1.]), 'lb': np.array([0.])}
    f_opt, x_opt, res = isres(pm.get_free_energy, 1, 1e-6, 1e-8, bounds,
                              np.array([0.5]))
    print(f_opt, x_opt, res)

    plot_fit(pm.get_beliefs(alpha=x_opt))

    # optimize perceptual surprise over multiple experimental blocks

    def total_fe(x, n_pars, blocks):
        # Sum the free energy of a fresh model per block; ``n_pars`` is
        # accepted for the optimiser's callback signature but not used.
        fe_sum = 0
        for block in blocks:
            model = RescorlaWagner(block, block.d_x)
            fe_sum += model.get_free_energy(x)

        return fe_sum

    n = 100
    T = 100
    # Build n separate environments. ``[MultiArmedBandit(T)] * n`` would
    # repeat a reference to ONE object, making every block identical.
    exp_blocks = [MultiArmedBandit(T) for _ in range(n)]

    def fe(x, p):
        return total_fe(x, p, exp_blocks)

    f_opt, x_opt, res = isres(fe, 1, 1e-6, 1e-8, bounds, np.array([0.5]))
    print(f_opt / n, x_opt, res)

    # Beliefs are still those of the first model/environment, now evaluated
    # at the parameter fitted across all blocks.
    plot_fit(pm.get_beliefs(alpha=x_opt))

Пример #2

Показать файл

Файл: pmodels.py Проект: dimarkov/pyBefit

def main():
    """Run single-block and multi-block RescorlaWagner fits and plot them.

    Steps, as performed below:

    * create one ``MultiArmedBandit(T)`` environment and a
      ``RescorlaWagner`` model on it, and read the environment's
      observations and hidden states;
    * minimise ``pm.get_free_energy`` with ``isres`` over one parameter
      bounded to [0, 1], starting at 0.5, then print and plot the result;
    * repeat the optimisation on the free energy summed over ``n``
      separately constructed environments, print the per-block average
      ``f_opt / n``, and plot again.

    NOTE(review): ``np`` and ``RescorlaWagner`` must already be available
    in the enclosing module; they are not imported here -- confirm.
    """
    from environments import MultiArmedBandit
    import seaborn as sns
    sns.set(style="white", palette="muted", color_codes=True)

    T = 100
    env = MultiArmedBandit(T)
    pm = RescorlaWagner(env, env.d_x)

    obs = env.get_observations()
    hst = env.get_hidden_states()

    # use isres for optimisation of one dimensional functions
    from optmethods import isres
    bounds = {'ub': np.array([1.]), 'lb': np.array([0.])}
    x_start = np.array([0.5])
    f_opt, x_opt, res = isres(pm.get_free_energy, 1, 1e-6, 1e-8, bounds,
                              x_start)
    print(f_opt, x_opt, res)

    post = pm.get_beliefs(alpha=x_opt)

    ax = obs.plot(y=r'$o_t$', style='go')
    ax = hst.plot(y=r'$p_t$', style='k--', ax=ax)
    ax = post.plot(y=r'$\mu_t$', style='r-', ax=ax)
    ax.legend(numpoints=1)

    # optimize perceptual surprise over multiple experimental blocks

    def total_fe(x, n_pars, blocks):
        # ``n_pars`` is unused; it is kept so the signature matches what
        # the wrapper below forwards from the optimiser.
        return sum(
            RescorlaWagner(b, b.d_x).get_free_energy(x) for b in blocks
        )

    n = 100
    T = 100
    # List repetition (``[obj] * n``) stores the same object n times, so
    # every "block" would be the one environment. Construct each block
    # individually instead.
    exp_blocks = [MultiArmedBandit(T) for _ in range(n)]

    def fe(x, p):
        return total_fe(x, p, exp_blocks)

    f_opt, x_opt, res = isres(fe, 1, 1e-6, 1e-8, bounds, np.array([0.5]))
    print(f_opt / n, x_opt, res)

    # ``pm`` is still the model of the first environment; its beliefs are
    # recomputed with the parameter fitted over all blocks.
    post = pm.get_beliefs(alpha=x_opt)

    ax = obs.plot(y=r'$o_t$', style='go')
    ax = hst.plot(y=r'$p_t$', style='k--', ax=ax)
    ax = post.plot(y=r'$\mu_t$', style='r-', ax=ax)
    ax.legend(numpoints=1)