Beispiel #1
0
 def make_feed_dict(self, xs, advantage, returns, mask, train=True):
     """Assemble the feed dict for the policy and value inputs.

     Args:
         xs: Input values handed to ``create_x_feed_dict`` for both the
             policy and the value input variables of ``self.ac_model``.
         advantage: Value fed for ``self.advantage``.
         returns: Value fed for ``self.returns``.
         mask: Value stored under the ``self.mask`` key.
         train: Currently unused; no train/test supplementary feeds are
             added by this method.

     Returns:
         The mapping produced by the first ``create_x_feed_dict`` call,
         extended in place with the remaining entries.
     """
     ac = self.ac_model
     feeds = create_x_feed_dict(ac.policy_input_vars, xs)
     feeds.update(create_x_feed_dict(ac.value_input_vars, xs))

     # Targets are added after the inputs, in the same order as before.
     targets = (
         (self.advantage, advantage),
         (self.returns, returns),
     )
     for y_var, y_val in targets:
         feeds.update(create_y_feed_dict(y_var, y_val))

     feeds[self.mask] = mask
     return feeds
Beispiel #2
0
 def make_feed_dict(self, xs, value, returns, mask, train=True):
     """Assemble the feed dict for the policy and value inputs.

     Args:
         xs: Input values handed to ``create_x_feed_dict`` for both the
             policy and the value input variables of ``self.ac_model``.
         value: Value fed for ``self.pred_value``.
         returns: Value fed for ``self.returns``.
         mask: Value stored under the ``self.mask`` key.
         train: Currently unused; no train/test supplementary feeds are
             added by this method.

     Returns:
         The mapping produced by the first ``create_x_feed_dict`` call,
         extended in place with the remaining entries.
     """
     ac = self.ac_model
     feeds = create_x_feed_dict(ac.policy_input_vars, xs)
     value_inputs = create_x_feed_dict(ac.value_input_vars, xs)
     feeds.update(value_inputs)

     # self.advantage is intentionally not fed here; only the predicted
     # value and the returns are supplied as targets.
     pred_feeds = create_y_feed_dict(self.pred_value, value)
     feeds.update(pred_feeds)
     return_feeds = create_y_feed_dict(self.returns, returns)
     feeds.update(return_feeds)

     feeds[self.mask] = mask
     return feeds
Beispiel #3
0
 def make_single_feed_dict(self, model, xs, y_var, y_val, train=True):
     """Build a feed dict for a single model and a single target.

     Args:
         model: Object providing ``get_input_vars()``; also passed to the
             supplementary feed helper.
         xs: Input values paired with the model's input variables.
         y_var: Target variable handed to ``create_y_feed_dict``.
         y_val: Value fed for ``y_var``.
         train: When truthy, the train supplementary feeds are added;
             otherwise the test supplementary feeds are added.

     Returns:
         The mapping produced by ``create_x_feed_dict``, extended in place.
     """
     feeds = create_x_feed_dict(model.get_input_vars(), xs)
     feeds.update(create_y_feed_dict(y_var, y_val))

     # Pick the helper matching the requested mode, then apply it once.
     build_supp = (create_supp_train_feed_dict if train
                   else create_supp_test_feed_dict)
     feeds.update(build_supp(model))
     return feeds
Beispiel #4
0
 def make_feed_dict(self, xs, y, mask, train=True):
     """Build the feed dict for ``self.q_model``.

     Args:
         xs: Input values paired with ``self.q_model.get_input_vars()``.
         y: Value fed for ``self.y``.
         mask: Value stored under the ``self.mask`` key.
         train: When truthy, the train supplementary feeds are added;
             otherwise the test supplementary feeds are added.

     Returns:
         The mapping produced by ``create_x_feed_dict``, extended in place.
     """
     q_model = self.q_model
     feeds = create_x_feed_dict(q_model.get_input_vars(), xs)
     feeds.update(create_y_feed_dict(self.y, y))
     feeds[self.mask] = mask

     # Supplementary feeds go last so they are applied after the mask.
     build_supp = (create_supp_train_feed_dict if train
                   else create_supp_test_feed_dict)
     feeds.update(build_supp(q_model))
     return feeds
Beispiel #5
0
 def make_feed_dict(self, xs, y, mask, train=True):
     """Return the feeds for ``self.q_model`` inputs, target and mask.

     Args:
         xs: Input values paired with ``self.q_model.get_input_vars()``.
         y: Value fed for ``self.y``.
         mask: Value stored under the ``self.mask`` key.
         train: Selects the train (truthy) or test (falsy) supplementary
             feeds.

     Returns:
         The mapping produced by ``create_x_feed_dict``, extended in place.
     """
     input_vars = self.q_model.get_input_vars()
     feeds = create_x_feed_dict(input_vars, xs)

     target_feeds = create_y_feed_dict(self.y, y)
     feeds.update(target_feeds)
     feeds[self.mask] = mask

     if not train:
         supp_feeds = create_supp_test_feed_dict(self.q_model)
     else:
         supp_feeds = create_supp_train_feed_dict(self.q_model)
     feeds.update(supp_feeds)
     return feeds
Beispiel #6
0
 def make_feed_dict(self, models, y_vars, inputs, train=True):
     """Build one combined feed dict covering several models.

     Args:
         models: Mapping from model name to a model providing
             ``get_input_vars()``.
         y_vars: Mapping from model name to that model's target variable.
         inputs: Indexable pair; ``inputs[0]`` maps model name to input
             values and ``inputs[1]`` maps model name to target values.
         train: Selects the train (truthy) or test (falsy) supplementary
             feeds for every model.

     Returns:
         A new dict holding the input, target and supplementary feeds of
         all models.
     """
     feeds = {}

     # First pass: inputs and targets for every model.
     for name, net in models.items():
         x_feeds = create_x_feed_dict(net.get_input_vars(),
                                      inputs[0][name])
         feeds.update(x_feeds)
         y_feeds = create_y_feed_dict(y_vars[name], inputs[1][name])
         feeds.update(y_feeds)

     # Second pass: supplementary feeds are applied only after all
     # input/target feeds, so they take precedence on any shared key.
     build_supp = (create_supp_train_feed_dict if train
                   else create_supp_test_feed_dict)
     for _, net in models.items():
         feeds.update(build_supp(net))
     return feeds
Beispiel #7
0
 def perform_update(self, batch):
     """Run ``self.train_step`` with feeds built from ``batch``.

     Args:
         batch: Passed whole to ``create_x_feed_dict`` as the input
             values; its ``'y'`` entry is fed for ``self.y``.
     """
     net = self.model
     feeds = create_x_feed_dict(net.get_input_vars(), batch)
     target_feeds = create_y_feed_dict(self.y, batch['y'])
     feeds.update(target_feeds)
     supp_feeds = create_supp_train_feed_dict(net)
     feeds.update(supp_feeds)
     self.train_step.run(feed_dict=feeds)
Beispiel #8
0
 def perform_update(self, batch):
     """Execute ``self.train_step`` once using the given batch.

     Args:
         batch: Supplies the input values for the model's input
             variables, and the target for ``self.y`` under key ``'y'``.
     """
     input_vars = self.model.get_input_vars()
     feeds = create_x_feed_dict(input_vars, batch)

     # Targets first, then the train-mode supplementary feeds.
     for extra in (create_y_feed_dict(self.y, batch['y']),
                   create_supp_train_feed_dict(self.model)):
         feeds.update(extra)

     self.train_step.run(feed_dict=feeds)
Beispiel #9
0
 def compute(self, model, xs, y_var, y_val):
     """Evaluate ``self.loss`` for ``model`` using test-mode feeds.

     Args:
         model: Object exposing ``input_vars``; also passed to
             ``create_supp_test_feed_dict``.
         xs: Input values paired with ``model.input_vars``.
         y_var: Target variable handed to ``create_y_feed_dict``.
         y_val: Value fed for ``y_var``.

     Returns:
         Whatever ``self.loss.eval`` returns for the assembled feeds.
     """
     feeds = create_x_feed_dict(model.input_vars, xs)
     target_feeds = create_y_feed_dict(y_var, y_val)
     feeds.update(target_feeds)
     supp_feeds = create_supp_test_feed_dict(model)
     feeds.update(supp_feeds)
     return self.loss.eval(feed_dict=feeds)
Beispiel #10
0
 def compute(self, model, xs, y_var, y_val):
     """Return the value of ``self.loss`` under test-mode feeds.

     Args:
         model: Object exposing ``input_vars``; also passed to
             ``create_supp_test_feed_dict``.
         xs: Input values paired with ``model.input_vars``.
         y_var: Target variable handed to ``create_y_feed_dict``.
         y_val: Value fed for ``y_var``.

     Returns:
         The result of ``self.loss.eval`` on the assembled feed dict.
     """
     feeds = create_x_feed_dict(model.input_vars, xs)

     # Targets first, then the test-mode supplementary feeds.
     for extra in (create_y_feed_dict(y_var, y_val),
                   create_supp_test_feed_dict(model)):
         feeds.update(extra)

     return self.loss.eval(feed_dict=feeds)