Ejemplos de DNN.save en Python

Lenguaje de programación: Python

Namespace/Package Name: model

Clase / Tipo: DNN

Método / Función: save

Ejemplos en hotexamples.com: 2

Python DNN.save - 2 ejemplos encontrados. Estos son los ejemplos en Python del mundo real mejor valorados de model.DNN.save extraídos de proyectos de código abierto. Puedes valorar ejemplos para ayudarnos a mejorar la calidad de los ejemplos.

Métodos usados con frecuencia

Mostrar Ocultar

DNN(29)

parameters(10)

fit(7)

load_state_dict(7)

state_dict(6)

to(5)

eval(5)

train(4)

compile(3)

predict(3)

embeddings(2)

summary(2)

save(2)

set_save_path(1)

save_weights(1)

model(1)

predict_proba(1)

predict_classes(1)

updata(1)

out(1)

save_session(1)

load_model(1)

load_weights(1)

DomainPredictor(1)

load(1)

inference(1)

forward(1)

fc5(1)

fc4(1)

cuda(1)

cross_entropy_loss(1)

build_model(1)

backward(1)

apply(1)

accuracy(1)

Predictor(1)

Feature(1)

zero_grad(1)

Ejemplo n.º 1

Mostrar archivo

Archivo: agent.py Proyecto: denishuenniger/open-ai

class Agent:
    """
    Class representing a learning agent acting in an environment.

    The agent samples episodes with its current policy model, keeps the
    episodes whose reward reaches a percentile bound and fits the model on
    the state/action pairs of those episodes.
    """
    def __init__(self,
                 p,
                 lr,
                 game="CartPole-v1",
                 mean_bound=5,
                 reward_bound=495.0,
                 save_model=10):
        """
        Constructor of the agent class.
            - game="CartPole-v1" : Name of the game environment
            - mean_bound=5 : Number of last acquired rewards considered for mean reward
            - reward_bound=495.0 : Reward acquired for completing an episode properly
            - save_model=10 : Interval for saving the model

            - p : Percentile for selecting training data
            - lr : Learning rate for the CE model
        """

        # Environment variables
        self.game = game
        self.env = gym.make(self.game)
        self.num_states = self.env.observation_space.shape[0]
        self.num_actions = self.env.action_space.n

        # Agent variables
        # p is multiplied by 100 because it is later handed to np.percentile.
        self.p = p * 100
        self.mean_bound = mean_bound
        self.reward_bound = reward_bound

        # DQN variables
        self.lr = lr
        self.model = DNN(self.num_states, self.num_actions, self.lr)
        self.save_model = save_model

        # File paths
        directory = os.path.dirname(__file__)
        self.path_model = os.path.join(directory, "../models/dnn.h5")
        self.path_plot = os.path.join(directory, "../plots/dnn.png")

        # Load model, if it already exists
        try:
            self.model.load(self.path_model)
        except Exception:
            # Loading stays best effort, but only ordinary errors are
            # swallowed: KeyboardInterrupt and SystemExit still propagate.
            print("Model does not exist! Create new model...")

    def get_action(self, state):
        """
        Returns an action for a given state, based on the current policy.
            - state : Current state of the agent
        """

        # The model is queried with a batch containing this single state.
        state = state.reshape(1, -1)
        policy = self.model.predict(state)[0]
        # The prediction is used as the probability of each action.
        action = np.random.choice(self.num_actions, p=policy)

        return action

    def sample(self, num_episodes):
        """
        Returns the rewards and the state/action tuples for a given number of episodes.
            - num_episodes : Number of episodes to sample
        """

        episodes = [[] for _ in range(num_episodes)]
        rewards = [0.0 for _ in range(num_episodes)]

        for episode in range(num_episodes):
            state = self.env.reset()
            total_reward = 0.0

            while True:
                action = self.get_action(state)
                next_state, reward, done, _ = self.env.step(action)
                # Store the state the action was chosen in, not its successor.
                episodes[episode].append((state, action))
                state = next_state

                # Penalize agent if pole could not be balanced until end of episode.
                # NOTE(review): this compares the reward of the final step, not
                # the accumulated total_reward - confirm this is intended.
                if done and reward < 499.0:
                    reward = -100.0

                total_reward += reward

                if done:
                    total_reward += 100.0
                    rewards[episode] = total_reward
                    break

        return rewards, episodes

    def get_training_data(self, episodes, rewards):
        """
        Returns training data for the CE model together with the reward bound used.
            - episodes : List of state/action tuples
            - rewards : List of gained rewards
        """

        x_train, y_train = [], []
        reward_bound = np.percentile(rewards, self.p)

        # Only episodes that reach the percentile bound contribute samples.
        for episode, reward in zip(episodes, rewards):
            if reward >= reward_bound:
                states = [step[0] for step in episode]
                actions = [step[1] for step in episode]
                x_train.extend(states)
                y_train.extend(actions)

        x_train = np.asarray(x_train)
        y_train = to_categorical(y_train, num_classes=self.num_actions)

        return x_train, y_train, reward_bound

    def train(self, num_epochs, num_episodes, report_interval):
        """
        Trains the CE model for a given number of epochs and episodes. Outputting report information is controlled by a given time interval.
            - num_epochs : Number of epochs to train
            - num_episodes : Number of episodes to train
            - report_interval : Interval for outputting report information of training
        """

        total_rewards = []

        for epoch in range(1, num_epochs + 1):
            # Periodic checkpoint, written before this epoch's fit.
            if epoch % self.save_model == 0:
                self.model.save(self.path_model)

            rewards, episodes = self.sample(num_episodes)
            x_train, y_train, reward_bound = self.get_training_data(
                episodes, rewards)

            mean_reward = np.mean(rewards)
            total_rewards.extend(rewards)
            mean_total_reward = np.mean(total_rewards[-self.mean_bound:])

            if epoch % report_interval == 0:
                # epoch is already 1-based, so it is printed as is.
                print(f"Epoch: {epoch}/{num_epochs}"
                      f"\tMean Reward: {mean_reward : .2f}"
                      f"\tReward Bound: {reward_bound : .2f}")

                self.plot_rewards(total_rewards)

            if mean_total_reward > self.reward_bound:
                self.model.save(self.path_model)

            self.model.fit(x_train, y_train)

        self.model.save(self.path_model)

    def play(self, num_episodes):
        """
        Renders the environment while the agent plays a given number of episodes and prints the reward of each episode.
            - num_episodes : Number of episodes to play
        """

        for episode in range(1, num_episodes + 1):
            state = self.env.reset()
            total_reward = 0.0

            while True:
                self.env.render()
                action = self.get_action(state)
                state, reward, done, _ = self.env.step(action)
                total_reward += reward

                if done:
                    # episode is already 1-based, so it is printed as is.
                    print(f"Episode: {episode}/{num_episodes}"
                          f"\tReward: {total_reward : .2f}")

                    break

    def plot_rewards(self, total_rewards):
        """
        Plots the rewards together with their linear regression line and saves the figure to the plot path.
            - total_rewards : List of rewards gained so far
        """

        # An array (instead of a range) makes slope * x well defined.
        x = np.arange(len(total_rewards))
        y = total_rewards

        slope, intercept, _, _, _ = linregress(x, y)

        # Use a dedicated figure and close it afterwards; drawing on the
        # implicit current figure would overlay the curves of every
        # previous call in the saved image.
        fig = plt.figure()
        try:
            plt.plot(x, y, linewidth=0.8)
            plt.plot(x, slope * x + intercept, color="red", linestyle="-.")
            plt.xlabel("Episode")
            plt.ylabel("Reward")
            plt.title("CE-Learning")
            plt.savefig(self.path_plot)
        finally:
            plt.close(fig)

Ejemplo n.º 2

Mostrar archivo

Archivo: main.py Proyecto: alokrkmv/test_tensorflow_ddi_projects

                zerotrain = zerotrain + 1
                train_label_new.append(0)
            else:
                nozerotrain = nozerotrain + 1
                train_label_new.append(1)

        prefilter_train = np.concatenate((train1, train2), axis=1)
        prefilter_test = np.concatenate((test1, test2), axis=1)

        train_label_new_forDNN = np.array([[0, 1] if i == 1 else [1, 0] for i in train_label_new])

        test_label_new_forDNN = np.array([[0, 1] if i == 1 else [1, 0] for i in real_labels])

        model_DNN = DNN()
        model_DNN.fit(prefilter_train, train_label_new_forDNN, epochs=30, batch_size=200)
        model_DNN.save("my_model")
        # model_DNN = models.load_model("my_model")
        print(model_DNN.summary())
        print(model_DNN.summary())
        proba = model_DNN.predict_classes(prefilter_test, batch_size=200, verbose=True)
        ae_y_pred_prob = model_DNN.predict_proba(prefilter_test, batch_size=200, verbose=True)
        acc, precision, sensitivity, specificity, MCC = calculate_performace(len(real_labels), proba, real_labels)
        fpr, tpr, auc_thresholds = roc_curve(real_labels, ae_y_pred_prob[:, 1])
        auc_score = auc(fpr, tpr)

        precision1, recall, pr_threshods = precision_recall_curve(real_labels, ae_y_pred_prob[:, 1])
        aupr_score = auc(recall, precision1)
        # f = f1_score(real_labels, transfer_label_from_prob(ae_y_pred_prob[:,1]))
        all_F_measure = np.zeros(len(pr_threshods))

        print(auc_score)