def start_model_server(self, model_server):
    """Bring up the model server for this task and keep its client alive.

    Does nothing unless ``model_server.name()`` equals ``self._task_name``.
    Otherwise the server returned by ``get_model_server_by_name`` for that
    task name is wired to a freshly built ``ModelServerAdapter``,
    initialised and started with ``run_server()``.

    After start-up the method loops forever: it restarts the client, then
    calls ``execute_loop_wait()``, and starts over whenever that returns or
    raises ``PsError``. It therefore only returns through the early exit
    above; any exception other than ``PsError`` propagates to the caller.

    Args:
        model_server: Candidate server. Only its ``name()`` is consulted;
            afterwards the name is rebound to the server looked up by
            ``self._task_name``.
    """
    if model_server.name() != self._task_name:
        return

    retry_delay = 10  # seconds to wait between attempts

    # From here on, operate on the server registered under our task name.
    model_server = get_model_server_by_name(self._task_name)
    adapter = ModelServerAdapter(
        self._zk_addr,
        self._model_server.index(self._task_name) + 1,
        self._task_index,
        model_server.forward_cache,
        model_server.backward_cache,
        model_server.dtype())
    adapter.init()
    model_server.init_server(adapter)

    # Connect and run the register/initializer ops, retrying on PsError
    # until one full pass succeeds.
    with model_scope("ams_gear_forward"):
        while True:
            try:
                connect_to_client(self._zk_addr, '')
                if variable_registers() is not None:
                    execute(variable_registers())
                execute(global_initializers())
                break
            except PsError:
                traceback.print_exc()
                time.sleep(retry_delay)

    model_server.run_server()

    # Serve loop: no exit condition, so this runs until the process dies or
    # a non-PsError exception escapes.
    while True:
        try:
            # Keep trying until restart_client() reports success.
            while True:
                # Call form prints the same text under Python 2's print
                # statement and is also valid Python 3.
                print("RESTARTING CLIENT")
                if restart_client():
                    break
                time.sleep(retry_delay)
            execute_loop_wait()
        except PsError:
            traceback.print_exc()
            time.sleep(retry_delay)
def create_session(self):
    """Run the register and initializer ops for the current model scopes.

    The scopes from ``get_model_scopes()`` are snapshotted into a list.
    If ``global_variables(scopes)`` is ``None`` or empty, nothing is
    executed. Otherwise ``variable_registers(scopes)`` and then
    ``global_initializers(scopes)`` are passed, in that order, to
    ``execute_with_retry``.
    """
    scopes = list(get_model_scopes())

    nothing_to_do = (global_variables(scopes) is None
                     or len(global_variables(scopes)) == 0)
    if nothing_to_do:
        return

    register_ops = variable_registers(scopes)
    execute_with_retry(register_ops)

    init_ops = global_initializers(scopes)
    execute_with_retry(init_ops)
def create_session(self):
    """Run the register ops, then block until every variable is initialised.

    Returns immediately when ``global_variables()`` is ``None`` or empty.
    Otherwise ``variable_registers()`` is executed once, and each global
    variable's ``is_initialized_op`` is polled through
    ``execute_with_retry`` until it yields ``[1]``. After every
    unsuccessful poll a message is printed and the method sleeps
    0.1 s when ``is_local_mode()`` is true, 3 s otherwise.
    """
    if global_variables() is None or len(global_variables()) == 0:
        return

    execute_with_retry(variable_registers())

    # Variables whose initialisation has not been confirmed yet.
    pending = set(global_variables())
    while pending:
        for variable in global_variables():
            if variable in pending:
                status = execute_with_retry([variable.is_initialized_op])
                if status == [1]:
                    pending.remove(variable)
                else:
                    print('waiting for initialize variable[%s]' % variable.name)
                    time.sleep(0.1 if is_local_mode() else 3)
def create_session(self):
    """Run the register ops followed by the global initializers.

    Nothing is executed when ``global_variables()`` is ``None`` or empty.
    Otherwise ``variable_registers()`` and then ``global_initializers()``
    are passed, in that order, to ``execute_with_retry``.
    """
    has_variables = (global_variables() is not None
                     and len(global_variables()) != 0)
    if has_variables:
        execute_with_retry(variable_registers())
        execute_with_retry(global_initializers())