Example #1
import torch


# NOTE: this example begins mid-function; the signature below is reconstructed
# from the names used in the body (point_distance, L_pck, alpha) and is an
# assumption, not part of the original snippet.
def correct_keypoints(point_distance, L_pck, alpha=0.1):
    # PCK: a keypoint counts as correct if its distance to the ground truth
    # falls within alpha times the per-image reference length L_pck.
    L_pck_mat = L_pck[0].expand_as(point_distance)
    correct_points = torch.le(point_distance, L_pck_mat * alpha)
    pck = torch.mean(correct_points.float())
    return pck
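
# Minimal usage sketch for the reconstructed function above; the shapes and
# values are illustrative assumptions, not taken from the original code:
#   point_distance = torch.tensor([3.0, 8.0, 12.0, 50.0, 2.0])  # pixels
#   L_pck = torch.tensor([[100.0]])                              # reference length
#   correct_keypoints(point_distance, L_pck, alpha=0.1)          # -> 0.60 (3/5 within 10 px)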


# Training
best_pck = 0
for ep in range(args.epochs):
    log('Current epoch : %d\n' % ep, LOGGER_FILE)
    log(
        'Current learning rate : %e\n' %
        optimizer.state_dict()['param_groups'][0]['lr'], LOGGER_FILE)

    net.train()
    # Keep the (frozen) feature extractor in eval mode so its batch-norm
    # statistics are not updated during training.
    net.feature_extraction.eval()
    total_loss = 0
    for i, batch in enumerate(train_loader):
        src_image = batch['image1'].to(device)
        tgt_image = batch['image2'].to(device)
        GT_src_mask = batch['mask1'].to(device)
        GT_tgt_mask = batch['mask2'].to(device)

        output = net(src_image, tgt_image, GT_src_mask, GT_tgt_mask)

        optimizer.zero_grad()
        loss, L1, L2, L3 = criterion(output, GT_src_mask, GT_tgt_mask)
        loss.backward()
        optimizer.step()
        total_loss += loss.item()

    # Step the LR scheduler once per epoch, after the optimizer updates
    # (the required ordering in PyTorch >= 1.1).
    scheduler.step()
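
    # best_pck above implies a validation pass was truncated from this example.
    # A hedged sketch of what it likely tracked (eval_pck, val_loader and
    # MODEL_FILE are assumptions, not from the original code):
    #   net.eval()
    #   with torch.no_grad():
    #       pck = eval_pck(net, val_loader)
    #   if pck > best_pck:
    #       best_pck = pck
    #       torch.save(net.state_dict(), MODEL_FILE)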
Example #2
# Imports reconstructed for this example; load_config_from_json, ModCloth,
# SFNet, to_var and compute_metrics are assumed to be project-local helpers.
# The SummaryWriter import is an assumption (the original may use tensorboardX).
import os
import time
from collections import OrderedDict, defaultdict

import jsonlines
import numpy as np
import torch
from torch.utils.data import DataLoader
from torch.utils.tensorboard import SummaryWriter

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")


def main(args):

    ts = time.strftime("%Y-%b-%d-%H-%M-%S", time.gmtime())

    data_config = load_config_from_json(args.data_config_path)
    model_config = load_config_from_json(args.model_config_path)

    splits = ["train", "valid"]

    datasets = OrderedDict()
    for split in splits:
        datasets[split] = ModCloth(data_config, split=split)

    # initialize model
    model = SFNet(model_config["sfnet"])
    model = model.to(device)

    print("-" * 50)
    print(model)
    print("-" * 50)
    print("Number of model parameters: {}".format(
        sum(p.numel() for p in model.parameters())))
    print("-" * 50)

    save_model_path = os.path.join(
        model_config["logging"]["save_model_path"],
        model_config["logging"]["run_name"] + ts,
    )
    os.makedirs(save_model_path)

    if model_config["logging"]["tensorboard"]:
        writer = SummaryWriter(os.path.join(save_model_path, "logs"))
        writer.add_text("model", str(model))
        writer.add_text("args", str(args))

    loss_criterion = torch.nn.CrossEntropyLoss(reduction="mean")

    optimizer = torch.optim.Adam(
        model.parameters(),
        lr=model_config["trainer"]["optimizer"]["lr"],
        weight_decay=model_config["trainer"]["optimizer"]["weight_decay"],
    )

    step = 0
    tensor = torch.cuda.FloatTensor if torch.cuda.is_available() else torch.Tensor

    for epoch in range(model_config["trainer"]["num_epochs"]):

        for split in splits:

            data_loader = DataLoader(
                dataset=datasets[split],
                batch_size=model_config["trainer"]["batch_size"],
                shuffle=split == "train",
            )

            loss_tracker = defaultdict(tensor)

            # Enable/Disable Dropout
            if split == "train":
                model.train()
            else:
                model.eval()
                target_tracker = []
                pred_tracker = []

            for iteration, batch in enumerate(data_loader):

                for k, v in batch.items():
                    if torch.is_tensor(v):
                        batch[k] = to_var(v)

                # Forward pass
                logits, pred_probs = model(batch)

                # loss calculation
                loss = loss_criterion(logits, batch["fit"])

                # backward + optimization
                if split == "train":
                    optimizer.zero_grad()
                    loss.backward()
                    optimizer.step()
                    step += 1

                # bookkeeping: append this batch's loss to the running tracker
                loss_tracker["Total Loss"] = torch.cat(
                    (loss_tracker["Total Loss"], loss.view(1)))

                if model_config["logging"]["tensorboard"]:
                    writer.add_scalar(
                        "%s/Total Loss" % split.upper(),
                        loss.item(),
                        epoch * len(data_loader) + iteration,
                    )

                print_every = model_config["logging"]["print_every"]
                if iteration % print_every == 0 or iteration + 1 == len(data_loader):
                    print("{} Batch Stats {}/{}, Loss={:.2f}".format(
                        split.upper(), iteration, len(data_loader) - 1,
                        loss.item()))

                if split == "valid":
                    target_tracker.append(batch["fit"].cpu().numpy())
                    pred_tracker.append(pred_probs.cpu().data.numpy())

            print("%s Epoch %02d/%i, Mean Total Loss %9.4f" % (
                split.upper(),
                epoch + 1,
                model_config["trainer"]["num_epochs"],
                torch.mean(loss_tracker["Total Loss"]),
            ))

            if model_config["logging"]["tensorboard"]:
                writer.add_scalar(
                    "%s-Epoch/Total Loss" % split.upper(),
                    torch.mean(loss_tracker["Total Loss"]),
                    epoch,
                )

            # Save checkpoint
            if split == "train":
                checkpoint_path = os.path.join(save_model_path,
                                               "E%i.pytorch" % (epoch + 1))
                torch.save(model.state_dict(), checkpoint_path)
                print("Model saved at %s" % checkpoint_path)

        # After the split loop, `split` still holds "valid" (the last entry in
        # splits), so the epoch-level metrics below run once per epoch.
        if split == "valid" and model_config["logging"]["tensorboard"]:
            # not considering the last (incomplete) batch for metrics
            target_tracker = np.stack(target_tracker[:-1]).reshape(-1)
            pred_tracker = np.stack(pred_tracker[:-1], axis=0).reshape(
                -1, model_config["sfnet"]["num_targets"])
            precision, recall, f1_score, accuracy, auc = compute_metrics(
                target_tracker, pred_tracker)

            writer.add_scalar("%s-Epoch/Precision" % split.upper(), precision,
                              epoch)
            writer.add_scalar("%s-Epoch/Recall" % split.upper(), recall, epoch)
            writer.add_scalar("%s-Epoch/F1-Score" % split.upper(), f1_score,
                              epoch)
            writer.add_scalar("%s-Epoch/Accuracy" % split.upper(), accuracy,
                              epoch)
            writer.add_scalar("%s-Epoch/AUC" % split.upper(), auc, epoch)

    # Save Model Config File
    with jsonlines.open(os.path.join(save_model_path, "config.jsonl"),
                        "w") as fout:
        fout.write(model_config)
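

# Hedged sketch of the entry point this example implies; the flag names mirror
# the attributes read in main(), but the default paths are assumptions.
if __name__ == "__main__":
    import argparse

    parser = argparse.ArgumentParser()
    parser.add_argument("--data_config_path", type=str, default="configs/data.json")
    parser.add_argument("--model_config_path", type=str, default="configs/model.json")
    main(parser.parse_args())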