def analyse_suboptimal_arm_pulls(self):
    """Compute per-arm gaps (deltas) and the theoretical upper bound on the
    number of pulls of each sub-optimal arm at every time step.

    Fills ``self.best_arm``, ``self.deltas`` and
    ``self.theoretical_bounds_arm_pulls`` (a (T+1, K) matrix whose entry
    (t, i) bounds the expected pulls of arm i after t rounds).
    """
    self.best_arm = mh.get_maximum_index(self.true_means)
    best_mean = self.true_means[self.best_arm]

    # Gap of each arm w.r.t. the best arm (zero for the best arm itself).
    for arm in range(self.K):
        self.deltas[arm] = best_mean - self.true_means[arm]

    # Instance-dependent 1/delta^2 terms used by the log-scaled bound.
    inv_sq_gaps = np.array(
        mh.get_instance_dependent_square_inverses(self.deltas, self.best_arm))

    # Additive constant: 1 + pi^2 / 3.
    addi_constant = rvh.func_of_pi(add=1, power=2, mult=1 / 3)

    log_times = rvh.natural_logarithm(np.arange(self.T + 1))

    # Outer product log(t) * (1/delta_i^2) gives the (T+1, K) bound matrix.
    self.theoretical_bounds_arm_pulls = (
        np.outer(log_times, inv_sq_gaps) + addi_constant)
def test_library_random_variables(self):
    """Smoke-test the random-variable helpers in ``rvh``.

    Exercises the uniform and Bernoulli samplers with both positional and
    keyword arguments. The return values are not asserted on; the test
    passes as long as every call completes without raising.
    """
    # Uniform distribution: 10 samples from U(0, 1).
    _ = rvh.get_uniform_sample(0, 1, 10)
    # Bernoulli distribution: single draw, then a batch of 10 draws.
    _ = rvh.get_bernoulli_sample(0.8)
    _ = rvh.get_bernoulli_sample(p=0.5, size=10)
    # NOTE(review): removed dead local `a = 5` (leftover breakpoint anchor).
def play_arms(self):
    """Run the doubling-epoch UCB strategy and return the reward history.

    Round t = 0 pulls every arm once; each subsequent epoch t refreshes the
    UCB estimates and pulls the arm with the highest UCB up to 2**t times,
    stopping once the total pull budget ``self.N`` is exhausted.

    Returns:
        list: rewards observed, with a leading sentinel 0 at index 0.
    """
    rewards = [0]  # index 0 is a placeholder for "time 0".
    pulls_done = 0

    # t = 0: sample each of the K arms exactly once.
    for arm in range(self.K):
        rewards.append(super().pull_arm(arm))
        pulls_done += 1

    # Epochs t = 1 .. ceil(log2(N)): commit to the current UCB leader.
    for epoch in range(1, rvh.ceiled_log_base_2(self.N) + 1):
        self.revise_ucbs(pulls_done)
        leader = mh.get_maximum_index(self.upper_confidence_bound)
        budget = 2 ** epoch  # pulls allotted to this epoch
        while budget > 0 and pulls_done < self.N:
            rewards.append(super().pull_arm(leader))
            pulls_done += 1
            budget -= 1

    return rewards
def get_arms(arm_count, tape_size):
    """Create ``arm_count`` Bernoulli arms with uniformly drawn means.

    Args:
        arm_count: number of arms to create.
        tape_size: length of each arm's pre-generated reward tape.

    Returns:
        tuple: (true_means, arms) — the sampled means and the Arm objects.
    """
    true_means = rvh.get_uniform_sample(0, 1, arm_count)
    arms = [Arm(mu, size=tape_size) for mu in true_means]
    return true_means, arms
def analyse_common_stats(self):
    """Compute per-arm gaps and the theoretical regret bound of UCB1.

    Fills ``self.best_arm``, ``self.deltas``,
    ``self.cum_regret_theo_bound`` (the c1*log(t) + c2 bound evaluated at
    every t in 0..T) and ``self.cum_optimal_reward`` (t times the best mean).
    """
    self.best_arm = mh.get_maximum_index(self.true_means)
    best_mean = self.true_means[self.best_arm]

    # Gap of each arm w.r.t. the best arm (zero for the best arm itself).
    for arm in range(self.K):
        self.deltas[arm] = best_mean - self.true_means[arm]

    # Instance-dependent sums feeding the multiplicative/additive constants.
    sum_del_inv, sum_del = mh.get_instance_dependent_values(
        self.best_arm, self.deltas)
    mult_c, addi_c = mh.get_theoretical_constants(sum_del_inv, sum_del)

    steps = np.arange(self.T + 1)
    self.cum_regret_theo_bound = (
        mult_c * rvh.natural_logarithm(steps) + addi_c)
    self.cum_optimal_reward = best_mean * steps
def get_theoretical_constants(sum_del_inv, sum_del):
    """Return the (multiplicative, additive) constants of the UCB1 bound.

    The multiplicative constant is 2 * sum(1/delta_i); the additive one is
    (1 + pi^2/3) * sum(delta_i).
    """
    additive = sum_del * rvh.func_of_pi(add=1, power=2, mult=1 / 3)
    return 2 * sum_del_inv, additive
def __init__(self, mean, size=10**7):
    """Create an arm with the given true mean.

    Args:
        mean: Bernoulli success probability of this arm's rewards.
        size: length of the pre-generated reward tape (default 10**7).
    """
    self._mean = mean
    # Rewards are drawn up front onto a fixed tape; pulls consume it
    # sequentially starting from index 0.
    self._tape_index = 0
    self._tape = rvh.get_bernoulli_sample(p=mean, size=size)