#datapre = DataLoader(train_dir, vocab, transform) #data = datapre.gen_data() data = dataloader(train_dir, vocab, transform) print('train data loaded') #set up CNN and RNN cnn = CNN(embedding_size=embedding_size) rnn = RNN(embedding_dim=embedding_size, hidden_dim=hidden_size, vocab_size=vocab.index) #running with CUDA if torch.cuda.is_available(): with torch.cuda.device(gpu_device): cnn.cuda() rnn.cuda() # set up loss function and optimizer criterion = nn.CrossEntropyLoss() params = list(cnn.linear.parameters()) + list(rnn.parameters()) optimizer = torch.optim.Adam(params, lr=learning_rate) losses, iter = [], [] n = 0 # training print('start training') for epoch in range(epochs): #img_sf, cap_sf = shuffle_data(data, seed= epoch) img_sf, cap_sf = data.shuffle(seed=epoch) cap_len = len(cap_sf) loss_tot = []
# NOTE(review): this chunk begins mid-statement — the train_loader
# DataLoader(...) call opens before this view; these are its trailing
# keyword arguments.
        drop_last=True, shuffle=True)
# Held-out split: test=True switches ECGDataset to the test file.
test_loader = torch.utils.data.DataLoader(
    DataUtils.ECGDataset(train_path, test_path, test=True),
    batch_size=args.test_batch_size,
    drop_last=True, shuffle=True)

# Earlier model configurations, kept commented out for reference:
#model = LSTM(28*28, 64, 10) MNIST dataset
#model = LSTM(140, 64, 5)
#model = FC(28 * 28, 300, 100, 10)
#model = TTRNN([4,7,4,7], [4,2,4,4], [1,3,4,2,1], 1, 0.8, 'ttgru')
#model = RNN([2,5,2,7], [4,4,2,4], [1,2,5,3,1], 0.8, 5)
# Presumably: tensor-train factorizations of input/hidden dims, TT-ranks,
# dropout 0.8, 5 output classes — TODO confirm against RNN's constructor.
model = RNN([1, 5, 2, 1], [2, 2, 2, 2], [1, 2, 2, 2, 1], 0.8, 5)
if args.cuda:
    model.cuda()

optimizer = TorchOptim.Adam(model.parameters(), lr=args.lr)


def train(epoch):
    """Run one training epoch over train_loader (body continues past this chunk)."""
    #model.train()
    for step, data in enumerate(train_loader):
        # NOTE(review): `train` shadows this function's own name.
        train = data[0]
        # Labels must be LongTensor for the loss computed later.
        target = data[1].type(torch.LongTensor)
        # Per-sample sequence length in units of feature_size.
        sequence_length = data[2] / args.feature_size
        if args.cuda:
            # NOTE(review): rebinds `data` (originally the batch tuple) to the
            # GPU tensor; on the non-CUDA path `data` stays a tuple, so the
            # .view() below would fail — looks like a latent bug, verify.
            data, target = train.cuda(), target.cuda()
        #data, target = TorchAutograd.Variable(data), TorchAutograd.Variable(target)
        output = model(data.view(args.train_batch_size, -1, args.feature_size).float(),
                       lengths=sequence_length)
        # ... (remainder of the loop is outside this chunk)
class Trainer:
    """Train an RNN/GRU surrogate of a pickled LTI system and report results.

    Relies on names defined elsewhere in this file: ``RNN``,
    ``tensor_to_cuda``, ``loss_func``, ``rel_space_dif``,
    ``all_state_metrics``, plus ``path`` (os.path), ``pickle``, ``np``,
    ``pd``, ``plt``, ``sns``, ``tqdm``, ``torch`` and ``optim``.
    """

    def __init__(self, TRAIN_CONFIGS, GRU_CONFIGS, FFN_CONFIGS=None):
        self.TRAIN_CONFIGS = TRAIN_CONFIGS
        # hidden/input sizes are implied by the LTI system, so GRU_CONFIGS is
        # completed from the data source before the model is built
        self.GRU_CONFIGS = self._process_gru_configs(GRU_CONFIGS)
        self.model = RNN(target=TRAIN_CONFIGS['target'],
                         **self.GRU_CONFIGS,
                         FFN_CONFIGS=FFN_CONFIGS)
        self.epochs_trained = 0
        self.trained = False
        # Storage for later (populated by `fit`)
        self.loss = self.val_loss = self.train_y_hat = self.train_y_true = \
            self.val_y_hat = self.val_y_true = None

    def _process_gru_configs(self, GRU_CONFIGS):
        """Fill in hidden_size/input_size implied by the LTI system.

        NOTE: mutates and returns the caller's dict (original behavior).
        """
        lti = self._load_data_source
        GRU_CONFIGS.update({
            # state dimension of the LTI system
            "hidden_size": lti.A.shape[-1],
            # input dimension; autonomous systems (B is None) get a dummy size 1
            "input_size": 1 if lti.B is None else lti.U.shape[-1],
        })
        return GRU_CONFIGS

    @property
    def _load_data_source(self):
        """Unpickle and return the LTI system object from disk.

        SECURITY NOTE: pickle.load executes arbitrary code — only load
        trusted files.
        """
        data_dir = self.TRAIN_CONFIGS.get("data_dir")
        lti_file = self.TRAIN_CONFIGS.get("lti_file")
        with open(path.join(data_dir, lti_file), "rb") as f:
            lti = pickle.load(f)
        return lti

    @property
    def _load_train_data(self):
        """Return (Y, H, X, h0) with a batch dimension inserted at axis -2.

        h0 is None only when TRAIN_CONFIGS['init_h'] == False; a missing key
        keeps the initial hidden state, reshaped to
        (num_layers, 1, hidden_size).
        """
        def _unsqueeze(M):
            # insert a batch dimension; pass None through untouched
            return M if M is None else M.unsqueeze(-2)

        lti = self._load_data_source
        Y, H, X, h0 = lti.torch
        _Y, _H, _X = (_unsqueeze(M) for M in (Y, H, X))
        # `== False` is deliberate: a missing key (None) must still use h0
        _h0 = None if self.TRAIN_CONFIGS.get("init_h") == False else h0.reshape(
            self.GRU_CONFIGS["num_layers"], 1, self.GRU_CONFIGS["hidden_size"])
        return _Y, _H, _X, _h0

    @property
    def fit(self):
        """Train once; return ((loss, val_loss), train (hat, true), val (hat, true)).

        Raises:
            ValueError: if the model has already been trained.
        """
        if self.trained:
            # Safety: refitting would silently continue from trained weights.
            raise ValueError("Model has already been trained.")

        # get configs (for readability)
        nEpochs = self.TRAIN_CONFIGS['epochs']
        train_steps = self.TRAIN_CONFIGS['train_steps']
        init_h = self.TRAIN_CONFIGS['init_h']
        base = self.TRAIN_CONFIGS['base']

        # load data
        Y, H, X, h0 = tensor_to_cuda(*self._load_train_data)

        # split data along the time axis
        if self.TRAIN_CONFIGS['target'] == 'states':
            y_train, y_val = H[:train_steps], H[train_steps:]
        elif self.TRAIN_CONFIGS['target'] == 'outputs':
            y_train, y_val = Y[:train_steps], Y[train_steps:]
        x_train, x_val = X[:train_steps], X[train_steps:]

        # prep model and optimizers
        self.model.cuda()
        optimizer = optim.Adam(self.model.parameters(), lr=1e-3)
        scheduler = optim.lr_scheduler.ReduceLROnPlateau(optimizer, patience=2)

        # train
        loss = [None] * nEpochs
        val_loss = [None] * nEpochs
        pbar = tqdm(total=nEpochs, leave=False)
        for i in range(nEpochs):
            # reset gradient
            optimizer.zero_grad()
            # generate prediction; optionally seed the hidden state with h0
            y_hat, h_plus1 = self.model(x_train, h0) if init_h else self.model(x_train)
            y_hat = y_hat.squeeze()
            # calculate loss
            l = loss_func(y_hat, y_train, base=base, epoch=i)
            loss[i] = l.item()
            # learn from loss
            l.backward()
            optimizer.step()
            scheduler.step(l.item())
            # validate (no gradients); continue from the post-training state
            with torch.no_grad():
                val_y_hat, _ = self.model(x_val, h_plus1) if init_h else self.model(x_val)
                val_y_hat = val_y_hat.squeeze()
                l = loss_func(val_y_hat, y_val, base=base, epoch=i)
                val_loss[i] = l.item()
            # progress-bar decoration
            pbar.set_description(f"Loss={loss[i]:.3f}. Val={val_loss[i]:.3f}")
            pbar.update(1)
        pbar.close()

        # persist results on the instance
        self.epochs_trained += nEpochs
        self.loss, self.val_loss = loss, val_loss
        self.train_y_hat, self.train_y_true = (y_hat.detach().cpu().squeeze(),
                                               y_train.detach().cpu().squeeze())
        self.val_y_hat, self.val_y_true = (val_y_hat.detach().cpu().squeeze(),
                                           y_val.detach().cpu().squeeze())
        self.trained = True

        return (self.loss, self.val_loss), \
            (self.train_y_hat, self.train_y_true), \
            (self.val_y_hat, self.val_y_true)

    def pickle_save(self, trial_num):
        """Pickle this Trainer (model + results) into the configured model_dir."""
        p = Trainer._pickle_path(self.TRAIN_CONFIGS, trial_num)
        with open(p, "wb") as f:
            pickle.dump(self, f)

    @staticmethod
    def pickled_exists(TRAIN_CONFIGS, trial_num):
        """Return True if a pickled Trainer for this config/trial exists."""
        return path.exists(Trainer._pickle_path(TRAIN_CONFIGS, trial_num))

    @staticmethod
    def _pickle_path(TRAIN_CONFIGS, trial_num):
        """Return the full pickle-file path for this config/trial."""
        name = Trainer.model_name(TRAIN_CONFIGS, trial_num)
        # plain str.endswith (the original np.char.endswith on a str was overkill)
        if not name.endswith(".pickle"):
            name += ".pickle"
        return path.join(TRAIN_CONFIGS.get("model_dir"), name)

    @staticmethod
    def _gen_relative_graphs(hat, true, dimOut, val_begins, trial_num, isState,
                             fig_dir=None, fname_prefix=None, freq=10,
                             pause=False):
        """Plot per-channel relative differences between `hat` and `true`.

        One figure per base channel: every other channel's error is plotted
        relative to that base, with the validation span shaded. Figures are
        saved only when both `fname_prefix` and `fig_dir` are given.
        """
        val_ends = hat.shape[0]
        palette = {
            "H1": "C0", "H2": "C1", "H3": "C2",
            "Y1": "C0", "Y2": "C1", "Y3": "C2"
        }
        for _base in range(dimOut):
            _dif = rel_space_dif(hat, true, _base)
            df = pd.DataFrame(_dif)
            # the base channel relative to itself is identically zero — drop it
            df = df.drop(_base, axis=1)
            _pre = "H" if isState else "Y"
            df.columns = _pre + (df.columns + 1).astype(str)
            df.columns.name = "Hidden States" if isState else "Output Indices"
            # "Itteration" (sic) is a runtime column label reused below; kept as-is
            df.index.name = "Itteration"
            df = df.stack()
            df.name = "Error"
            df = df.reset_index()
            # thin the plot: keep every `freq`-th iteration
            _df = df[df['Itteration'] % freq == 0]
            plt.axhline(0, color="k", alpha=0.5)
            _hue = "Hidden States" if isState else "Output Indices"
            sns.lineplot(data=_df, x="Itteration", y="Error", hue=_hue,
                         alpha=1, palette=palette)
            plt.title(f"Relative Difference (Base: {_pre}{_base+1})")
            plt.axvspan(val_begins, val_ends, facecolor="0.1", alpha=0.25)
            if fname_prefix is not None and fig_dir is not None:
                fname = fname_prefix + \
                    f"-relgraph-{_pre}{_base+1}-trial{trial_num}"
                # compute the target path once (it was duplicated before)
                plt.savefig(path.join(fig_dir, fname))
            else:
                print(f"fname_prefix='{fname_prefix}'; fig_dir='{fig_dir}'")
            if pause:
                plt.show()
            else:
                plt.show(block=False)
            plt.clf()

    @staticmethod
    def model_name(TRAIN_CONFIGS, trial_num):
        """Return the canonical model name: '<lti file stem>-trial<N>'."""
        fprefix = TRAIN_CONFIGS.get("lti_file").split(".")[0]
        return fprefix + f"-trial{trial_num}"

    @staticmethod
    def load_trained(TRAIN_CONFIGS, trial_num):
        """Load a previously pickled Trainer for this config/trial.

        SECURITY NOTE: unpickling executes arbitrary code — trusted files only.
        """
        # reuse _pickle_path instead of duplicating its name/suffix logic
        with open(Trainer._pickle_path(TRAIN_CONFIGS, trial_num), "rb") as f:
            trainer = pickle.load(f)
        return trainer

    def gen_relative_graphs(self, trial_num, freq=10, pause=False):
        """Graph relative train+validation prediction error for this model."""
        train_hat, train_true = self.train_y_hat, self.train_y_true
        val_hat, val_true = self.val_y_hat, self.val_y_true
        # derived
        dimOut = train_hat.shape[-1]
        val_begins = train_hat.shape[0]
        # combine predictions and true values across train and validation
        hat = np.concatenate([train_hat, val_hat])
        true = np.concatenate([train_true, val_true])
        # graph
        fprefix = self.TRAIN_CONFIGS.get("lti_file").split(".pickle")[0]
        # BUGFIX: target values are 'states'/'outputs' (see `fit`); the old
        # comparison against 'state' could never be true
        isState = self.TRAIN_CONFIGS.get("target") == "states"
        # BUGFIX: forward freq/pause — they were hard-coded to 10/False
        Trainer._gen_relative_graphs(hat, true, dimOut, val_begins, trial_num,
                                     isState, self.TRAIN_CONFIGS.get("fig_dir"),
                                     fprefix, freq=freq, pause=pause)

    @property
    def get_train_test_metrics(self):
        """Return (train, validation) metric tables for the trained model."""
        # BUGFIX: compare against 'states' (the value used in `fit`), not 'state'
        isState = self.TRAIN_CONFIGS.get("target") == "states"
        state_tups = [(self.train_y_hat, self.train_y_true),
                      (self.val_y_hat, self.val_y_true)]
        train, test = [
            all_state_metrics(state_hat, state_true, isState)
            for state_hat, state_true in state_tups
        ]
        return train, test

    def save_train_test_metrics(self, trial_num):
        """Write train/val metric tables to CSV in metrics_dir; return them."""
        metrics_dir = self.TRAIN_CONFIGS.get("metrics_dir")
        train, test = self.get_train_test_metrics
        _name = Trainer.model_name(self.TRAIN_CONFIGS, trial_num)
        train.to_csv(path.join(metrics_dir, _name + "-train.csv"))
        test.to_csv(path.join(metrics_dir, _name + "-val.csv"))
        return train, test