Example #1
    def train(self):
        '''
        Call this function when the episode ends.
        '''

        if not self.is_training:
            self.logger.info("Not in training mode")
            return
        else:
            self.logger.info("Update a2c policy parameters.")

        self.episodecount += 1
        self.logger.info("Sample Num so far: %s" % self.samplecount)
        self.logger.info("Episode Num so far: %s" % self.episodecount)

        # Bump the episode counter shared across all worker threads and reload the
        # latest shared policy parameters before computing gradients.
        Settings.add_count()
        globalEpisodeCount = copy.deepcopy(Settings.get_count())
        self.loadLastestPolicy()

        # Train once at least one minibatch of samples has been collected and the
        # shared episode counter hits the training frequency.
        if self.samplecount >= self.minibatch_size * 1 and globalEpisodeCount % self.training_frequency == 0:
            self.logger.info('start training...')

            assert len(Settings.global_policysaver) == Settings.global_threadsnum
            # self.dqn.reset_noise()
            # Each worker thread samples a batch, computes V-trace targets and
            # advantages, trains its local a2c network, and stores the resulting
            # gradients under its thread key.
            total_batch_size = 0
            for k, thread_policy in Settings.global_policysaver.items():
                s_batch, a_batch_one_hot, V_trace, advantage = Settings.global_hackpolicysaver[k]._sample_and_updateV()
                grad, batch_size = thread_policy.train(s_batch, a_batch_one_hot, V_trace, advantage)
                total_batch_size += batch_size
                Settings.load_grad(grad, k)

            # Sum the gradients collected from all threads, apply them to the shared
            # policy, and save the updated parameters.
            assert len(Settings.global_gradsaver) == Settings.global_threadsnum
            grads_list = Settings.grad_sum()
            self._load_and_update(grads_list, total_batch_size)
            self.savePolicyInc()
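
The helpers Settings.load_grad and Settings.grad_sum are not shown in these examples. A minimal sketch of the bookkeeping they imply, assuming each grad is a list of numpy arrays stored under its worker's key (the module-level dictionary and function names below are illustrative stand-ins, not the actual Settings module):

    import numpy as np

    _global_gradsaver = {}

    def load_grad(grad, key):
        # Store one worker's gradient list (numpy arrays) under its thread key.
        _global_gradsaver[key] = grad

    def grad_sum():
        # Element-wise sum of the gradient lists collected from every worker.
        grad_lists = list(_global_gradsaver.values())
        summed = [np.zeros_like(g) for g in grad_lists[0]]
        for grad_list in grad_lists:
            for i, g in enumerate(grad_list):
                summed[i] += g
        return summed

    # Example: two workers, each holding gradients for two parameter tensors.
    load_grad([np.ones(3), np.full((2, 2), 2.0)], 'worker_0')
    load_grad([np.ones(3), np.full((2, 2), 2.0)], 'worker_1')
    print([g.tolist() for g in grad_sum()])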
Example #2
    def train(self):
        '''
        Call this function when the episode ends.
        '''

        # print(threading.currentThread().getName() + ' Domain: ' +self.domainString + ' Training')

        if not self.is_training:
            self.logger.info("Not in training mode")
            return
        else:
            self.logger.info("Update dqn policy parameters.")

        self.episodecount += 1

        # lock = Settings.load_lock()
        # lock.acquire()
        # try:
        # Bump the episode counter shared across all worker threads.
        Settings.add_count()
        globalEpisodeCount = copy.deepcopy(Settings.get_count())

        # print('###################################################')
        # print(threading.currentThread().getName() + ' ' + str(globalEpisodeCount))

        self.logger.info("Sample Num so far: %s" % (self.samplecount))
        self.logger.info("Episode Num so far: %s" % (self.episodecount))

        # if self.samplecount >= self.minibatch_size * 10 and self.episodecount % self.training_frequency == 0:
        # Train once at least ten minibatches of samples have been collected and the
        # shared episode counter hits the training frequency.
        if self.samplecount >= self.minibatch_size * 10 and globalEpisodeCount % self.training_frequency == 0:
            self.logger.info('start training...')

            assert len(Settings.global_policysaver) == Settings.global_threadsnum
            # self.dqn.reset_noise()
            # Each worker thread samples a batch, computes the reshaped target
            # distribution, trains its local dqn, and stores the resulting gradients
            # under its thread key.
            total_batch_size = 0
            for k, thread_policy in Settings.global_policysaver.items():
                s_batch, a_batch_one_hot, reshaped_targetdis = Settings.global_hackpolicysaver[k]._sample_and_updateQ()
                grad, batch_size = thread_policy.train(s_batch, a_batch_one_hot, reshaped_targetdis)
                total_batch_size += batch_size
                Settings.load_grad(grad, k)

            # Sum the gradients collected from all threads, apply them to the shared
            # network, and save the updated parameters. Passing total_batch_size keeps
            # the normalization consistent with the number of samples actually used.
            assert len(Settings.global_gradsaver) == Settings.global_threadsnum
            grads_list = Settings.grad_sum()
            self._load_and_update(grads_list, total_batch_size)
            self._savePolicyInc()
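
Both examples finish by handing the summed gradients and a batch size to self._load_and_update, which is not shown here. A hedged sketch of the A3C-style step it presumably performs, averaging the gradient sum over the samples before updating the shared parameters, with a plain SGD step and the function name apply_summed_grads standing in for whatever optimizer and method the repo actually uses:

    import numpy as np

    def apply_summed_grads(params, summed_grads, total_batch_size, lr=1e-3):
        # Average the per-thread gradient sum by the number of samples, then
        # take one plain SGD step on the shared parameters.
        averaged = [g / float(total_batch_size) for g in summed_grads]
        return [p - lr * g for p, g in zip(params, averaged)]

    # Example: two parameter tensors, gradients summed over several workers.
    params = [np.ones((2, 2)), np.zeros(3)]
    summed = [np.full((2, 2), 3.0), np.full(3, 3.0)]
    new_params = apply_summed_grads(params, summed, total_batch_size=96)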