Example #1
def perform_testing():

    print('--- Performing Oracle Evaluation ---')
    testing_data_dict = helpers.csv_to_dict(training=False)
    keys = list(testing_data_dict.keys())
    testing_key = keys[0]  # Test on the first composer
    print('Testing on: ' + ' '.join(testing_key))
    # Get data
    _, y_annotated, _ = helpers.fetch_data(testing_data_dict, testing_key)

    # Get data dictionary
    training_data_dict = helpers.csv_to_dict(training=True)
    training_key = sorted(list(training_data_dict.keys()))[2]
    print('Using predictions from: ' + " ".join(training_key))
    # Get data
    _, y_noisy, _ = helpers.fetch_data(training_data_dict, training_key)

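    # prf is assumed to be sklearn.metrics.precision_recall_fscore_support (a module-level import)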
    res = prf(y_annotated, y_noisy, average='binary')
    cls_error = np.sum(
        np.abs(y_annotated - y_noisy)) / np.shape(y_annotated)[0] * 100.

    print('Precision: %.2f' % res[0])
    print('Recall: %.2f' % res[1])
    print('Fscore: %.2f' % res[2])
    print('Error: %.2f' % cls_error)

    return None
Example #2
def perform_training():
    # Check if the saving path exists
    if not os.path.isdir(os.path.join('results', exp_settings['split_name'])):
        print(
            'Saving directory was not found... Creating a new folder to store the results!'
        )
        os.makedirs(os.path.join('results', exp_settings['split_name']))

    # Get data dictionary
    data_dict = helpers.csv_to_dict(training=True)
    training_keys = sorted(list(
        data_dict.keys()))[0:exp_settings['split_training_indx']]
    print('Training on: ' + " ".join(training_keys))

    # Get data
    x, y, _ = helpers.fetch_data(data_dict, training_keys)
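    # Peak-normalize the waveform to just below full scale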
    x *= 0.99 / np.max(np.abs(x))

    # Length in samples
    d_p_length_samples = exp_settings['d_p_length'] * exp_settings['fs']

    # Initialize NN modules
    dropout = torch.nn.Dropout(exp_settings['drp_rate']).cuda()
    win_viz, _ = visualize.init_visdom()  # Web loss plotting
    dft_analysis, mel_analysis, pcen, gru_enc, gru_dec, fc_layer, label_smoother = build_model(
        flag='training')

    # Criterion
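    # (size_average=True follows the older PyTorch API; reduction='mean' is the modern equivalent)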
    bce_func = torch.nn.BCEWithLogitsLoss(size_average=True)

    # Initialize optimizer and add the parameters that will be updated
    if exp_settings['end2end']:
        parameters_list = list(dft_analysis.parameters()) + list(mel_analysis.parameters()) + list(pcen.parameters())\
                          + list(gru_enc.parameters()) + list(gru_dec.parameters()) + list(fc_layer.parameters())
    else:
        parameters_list = list(pcen.parameters()) + list(gru_enc.parameters())\
                          + list(gru_dec.parameters()) + list(fc_layer.parameters())

    optimizer = torch.optim.Adam(parameters_list, lr=1e-4)
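    # Two step schedulers share the optimizer: scheduler_n is assumed to shrink the
    # learning rate (gamma < 1) and scheduler_p to grow it (gamma > 1), as used in
    # the validation branch below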
    scheduler_n = StepLR(optimizer,
                         1,
                         gamma=exp_settings['learning_rate_drop'])
    scheduler_p = StepLR(optimizer,
                         1,
                         gamma=exp_settings['learning_date_incr'])

    # Start of the training
    batch_indx = 0
    number_of_data_points = len(x) // d_p_length_samples
    prv_cls_error = 100.
    best_error = 50.
    for epoch in range(1, exp_settings['epochs'] + 1):
        # Validation
        if not epoch == 1:
            cls_err = perform_validation([
                dft_analysis, mel_analysis, pcen, gru_enc, gru_dec, fc_layer,
                label_smoother
            ])

            if prv_cls_error - cls_err > 0:
                # Increase learning rate
                scheduler_p.step()
                if cls_err < best_error:
                    # Update best error
                    best_error = cls_err
                    print('--- Saving Model ---')
                    torch.save(
                        pcen.state_dict(),
                        os.path.join('results', exp_settings['split_name'],
                                     'en_pcen_bs_drp.pytorch'))
                    torch.save(
                        gru_enc.state_dict(),
                        os.path.join('results', exp_settings['split_name'],
                                     'en_gru_enc_bs_drp.pytorch'))
                    torch.save(
                        gru_dec.state_dict(),
                        os.path.join('results', exp_settings['split_name'],
                                     'en_gru_dec_bs_drp.pytorch'))
                    torch.save(
                        fc_layer.state_dict(),
                        os.path.join('results', exp_settings['split_name'],
                                     'en_cls_bs_drp.pytorch'))
            else:
                # Decrease learning rate
                scheduler_n.step()

            # Update classification error
            prv_cls_error = cls_err

        # Shuffle between sequences
        shuffled_data_points = np.random.permutation(
            np.arange(0, number_of_data_points))

        # Constructing batches
        available_batches = len(
            shuffled_data_points) // exp_settings['batch_size']
        for batch in tqdm(range(available_batches)):
            x_d_p, y_d_p = helpers.gimme_batches(batch, shuffled_data_points,
                                                 x, y)
            x_cuda = torch.autograd.Variable(
                torch.from_numpy(x_d_p).cuda(),
                requires_grad=False).float().detach()
            y_cuda = torch.autograd.Variable(
                torch.from_numpy(y_d_p).cuda(),
                requires_grad=False).float().detach()

            # Forward analysis pass: Input data
            x_real, x_imag = dft_analysis.forward(x_cuda)
            # Magnitude computation
            mag = torch.sqrt(x_real.pow(2) + x_imag.pow(2))

            # Mel analysis
            mel_mag = torch.autograd.Variable(mel_analysis.forward(mag).data,
                                              requires_grad=True).cuda()

            # Learned normalization
            mel_mag_pr = pcen.forward(mel_mag)

            # GRUs
            dr_mel_p = dropout(mel_mag_pr)
            h_enc = gru_enc.forward(dr_mel_p)
            h_dec = gru_dec.forward(h_enc)
            # Classifier
            _, vad_prob = fc_layer.forward(h_dec, mel_mag_pr)

            # Target data preparation
            y_true = label_smoother.forward(y_cuda).detach()
            vad_true = torch.autograd.Variable(y_true.data,
                                               requires_grad=True).cuda()

            # Loss
            loss = bce_func(vad_prob, vad_true)

            # Optimization
            optimizer.zero_grad()
            loss.backward()
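            # clip_grad_norm is the pre-1.0 PyTorch name; clip_grad_norm_ is the in-place successor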
            torch.nn.utils.clip_grad_norm(parameters_list,
                                          max_norm=60,
                                          norm_type=2)
            optimizer.step()

            # Update graph
            win_viz = visualize.viz.line(X=np.arange(batch_indx,
                                                     batch_indx + 1),
                                         Y=np.reshape(loss.data[0], (1, )),
                                         win=win_viz,
                                         update='append')
            batch_indx += 1

    return None
Example #3
def perform_cluster_visualization(singers=True):
    print('--- Performing Visualization ---')
    nn_list = list(build_model(flag='testing'))
    data_dict = helpers.csv_to_dict(training=False)
    keys = list(data_dict.keys())
    testing_key = keys[0]  # Test on the first composer
    print('Testing on: ' + ' '.join(testing_key))
    # Get data
    x, y, fs, singer_id_list = helpers.fetch_data_with_singer_ids(
        data_dict, testing_key)
    x *= 0.99 / np.max(np.abs(x))
    sigmoid = torch.nn.Sigmoid()  # Label helper!
    # Length in samples
    d_p_length_samples = exp_settings['d_p_length'] * exp_settings['fs']

    number_of_data_points = len(x) // d_p_length_samples
    for data_point in tqdm(range(number_of_data_points)):
        # Generate data
        x_d_p = x[data_point * d_p_length_samples:(data_point + 1) *
                  d_p_length_samples]
        y_d_p = y[data_point * d_p_length_samples:(data_point + 1) *
                  d_p_length_samples, :]
        # Reshape data
        x_d_p = x_d_p.reshape(1, d_p_length_samples)
        y_d_p = y_d_p.reshape(1, d_p_length_samples,
                              exp_settings['clust_dim'] + 1)
        x_cuda = torch.autograd.Variable(torch.from_numpy(x_d_p).cuda(),
                                         requires_grad=False).float().detach()
        y_cuda = torch.autograd.Variable(torch.from_numpy(y_d_p).cuda(),
                                         requires_grad=False).float().detach()

        # Forward analysis pass: Input data
        x_real, x_imag = nn_list[0].forward(x_cuda)
        # Magnitude computation
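        # (the L2 norm over the stacked real/imaginary parts equals sqrt(real^2 + imag^2))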
        mag = torch.norm(torch.cat((x_real, x_imag), 0), 2, dim=0).unsqueeze(0)
        # Mel analysis
        mel_mag = torch.autograd.Variable(nn_list[1].forward(mag).data,
                                          requires_grad=False)

        # Learned normalization
        mel_mag_pr = nn_list[2].forward(mel_mag)
        # GRUs
        h_enc = nn_list[3].forward(mel_mag_pr)
        h_dec = nn_list[4].forward(h_enc)
        # Classifier
        mel_filt, vad_prob, cl_space = nn_list[5].forward(h_dec,
                                                          mel_mag_pr,
                                                          ld_space=True)
        vad_prob = sigmoid(vad_prob)
        vad_prob = vad_prob.gt(0.51).float().data.cpu().numpy()[0, :, 0]
        cl_space = cl_space.data.cpu().numpy()[0, :]

        # Target data preparation: keep every label channel (channel 0 is
        # assumed to hold the overall voice-activity label, channels 1-3 the
        # per-singer labels used in the scatter plots below)
        y_true = nn_list[6].forward(y_cuda).detach().gt(
            0.5).float().data.cpu().numpy()[0, :, :]
        if data_point == 0:
            out_space = cl_space
            out_true_prob = y_true
            out_vad_prob = vad_prob
        else:
            out_space = np.vstack((out_space, cl_space))
            out_true_prob = np.vstack((out_true_prob, y_true))
            out_vad_prob = np.hstack((out_vad_prob, vad_prob))

    # Scatter plot
    fig = plt.figure()
    ax = Axes3D(fig)
    silence_examples = np.where(out_true_prob[:, 0] == 0)[0]

    ax.scatter(out_space[silence_examples, 0],
               out_space[silence_examples, 1],
               out_space[silence_examples, 2],
               c='black',
               s=0.5,
               vmax=1,
               vmin=-1,
               label='Silence',
               alpha=0.7)

    if singers:
        hunding_examples = np.where(out_true_prob[:, 1] == 1)[0]
        sieglinde_examples = np.where(out_true_prob[:, 2] == 1)[0]
        siegmund_examples = np.where(out_true_prob[:, 3] == 1)[0]

        ax.scatter(out_space[hunding_examples, 0],
                   out_space[hunding_examples, 1],
                   out_space[hunding_examples, 2],
                   c='red',
                   s=0.5,
                   vmax=1,
                   vmin=-1,
                   label='Hunding',
                   alpha=0.7)
        ax.scatter(out_space[sieglinde_examples, 0],
                   out_space[sieglinde_examples, 1],
                   out_space[sieglinde_examples, 2],
                   c='cyan',
                   s=0.5,
                   vmax=1,
                   vmin=-1,
                   label='Sieglinde',
                   alpha=0.7)
        ax.scatter(out_space[siegmund_examples, 0],
                   out_space[siegmund_examples, 1],
                   out_space[siegmund_examples, 2],
                   c='magenta',
                   s=0.5,
                   vmax=1,
                   vmin=-1,
                   label='Siegmund',
                   alpha=0.7)
    else:
        active_examples = np.where(out_true_prob[:, 0] == 1)[0]
        ax.scatter(out_space[active_examples, 0],
                   out_space[active_examples, 1],
                   out_space[active_examples, 2],
                   c='red',
                   s=0.5,
                   vmax=1,
                   vmin=-1,
                   label='Singing Voice',
                   alpha=0.7)

    ax.legend()
    ax.set_title('Low Dimensional Latent Space')
    ax.set_xlabel('x-axis')
    ax.set_ylabel('y-axis')
    ax.set_zlabel('z-axis')
    ax.view_init(elev=-141, azim=21)
    plt.savefig('/home/mis/GRU_PCEN.png', dpi=400)
    plt.show(block=False)

    return None
Example #4
def perform_testing():
    print('--- Performing Evaluation ---')
    nn_list = list(build_model(flag='testing'))
    data_dict = helpers.csv_to_dict(training=False)
    keys = list(data_dict.keys())
    testing_key = keys[0]  # Test on the first composer
    print('Testing on: ' + ' '.join(testing_key))
    # Get data
    x, y, fs = helpers.fetch_data(data_dict, testing_key)
    x *= 0.99 / np.max(np.abs(x))

    sigmoid = torch.nn.Sigmoid()  # Label helper!
    # Length in samples
    d_p_length_samples = exp_settings['d_p_length'] * exp_settings['fs']

    number_of_data_points = len(x) // d_p_length_samples
    for data_point in tqdm(range(number_of_data_points)):
        # Generate data
        x_d_p = x[data_point * d_p_length_samples:(data_point + 1) *
                  d_p_length_samples]
        y_d_p = y[data_point * d_p_length_samples:(data_point + 1) *
                  d_p_length_samples]

        # Reshape data
        x_d_p = x_d_p.reshape(1, d_p_length_samples)
        y_d_p = y_d_p.reshape(1, d_p_length_samples)
        x_cuda = torch.autograd.Variable(torch.from_numpy(x_d_p),
                                         requires_grad=False).float().detach()
        y_cuda = torch.autograd.Variable(torch.from_numpy(y_d_p),
                                         requires_grad=False).float().detach()
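        # Move the tensors to the GPU when CUDA/cuDNN support is available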
        if torch.has_cudnn:
            x_cuda = x_cuda.cuda()
            y_cuda = y_cuda.cuda()

        # Forward analysis pass: Input data
        x_real, x_imag = nn_list[0].forward(x_cuda)
        # Magnitude computation
        mag = torch.norm(torch.cat((x_real, x_imag), 0), 2, dim=0).unsqueeze(0)
        # Mel analysis
        mel_mag = torch.autograd.Variable(nn_list[1].forward(mag).data,
                                          requires_grad=False)

        # Learned normalization
        mel_mag_pr = nn_list[2].forward(mel_mag)
        # GRUs
        h_enc = nn_list[3].forward(mel_mag_pr)
        h_dec = nn_list[4].forward(h_enc)
        # Classifier
        _, vad_prob = nn_list[5].forward(h_dec, mel_mag_pr)
        vad_prob = sigmoid(vad_prob).gt(0.50).float().data.cpu().numpy()[0, :, 0]

        # Up-sample the labels to the time-domain
        # Target data preparation
        vad_true = nn_list[6].forward(y_cuda).gt(
            0.50).float().data.cpu().numpy()[0, :, 0]

        if data_point == 0:
            out_prob = vad_prob
            out_true_prob = vad_true
        else:
            out_prob = np.hstack((out_prob, vad_prob))
            out_true_prob = np.hstack((out_true_prob, vad_true))

    res = prf(out_true_prob, out_prob, average='binary')
    cls_error = np.sum(
        np.abs(out_true_prob - out_prob)) / np.shape(out_true_prob)[0] * 100.
    voice_regions_percentage = (len(
        np.where(out_true_prob == 1)[0])) / np.shape(out_true_prob)[0] * 100.
    non_voice_regions_percentage = (len(
        np.where(out_true_prob == 0)[0])) / np.shape(out_true_prob)[0] * 100.

    print('Precision: %.2f' % res[0])
    print('Recall: %.2f' % res[1])
    print('Fscore: %.2f' % res[2])
    print('Error: %.2f' % cls_error)
    print('Singing voice frames percentage: %.2f' % voice_regions_percentage)
    print('Non-singing voice frames percentage: %.2f' %
          non_voice_regions_percentage)

    print('-- Saving Results --')
    np.save(
        os.path.join('results', exp_settings['split_name'],
                     'lr_pcen_results.npy'), out_prob)
    np.save(
        os.path.join('results', exp_settings['split_name'],
                     'vad_true_targets.npy'), out_true_prob)

    return None
Example #5
def perform_validation(nn_list):
    print('--- Performing Validation ---')
    d_p_length_samples = exp_settings['d_p_length'] * exp_settings['fs']
    # Get data dictionary
    data_dict = helpers.csv_to_dict(training=True)
    keys = sorted(list(data_dict.keys()))
    validation_key = keys[exp_settings['split_validation_indx']]
    print('Validating on: ' + " ".join(validation_key))
    # Get data
    x, y, _ = helpers.fetch_data(data_dict, validation_key)
    x *= 0.99 / np.max(np.abs(x))

    sigmoid = torch.nn.Sigmoid()  # Label helper!

    # Constructing batches
    number_of_data_points = len(x) // d_p_length_samples
    available_batches = number_of_data_points // exp_settings['batch_size']
    data_points = np.arange(0, number_of_data_points)
    for batch in tqdm(range(available_batches)):
        x_d_p, y_d_p = helpers.gimme_batches(batch, data_points, x, y)

        x_cuda = torch.autograd.Variable(torch.from_numpy(x_d_p).cuda(),
                                         requires_grad=False).float().detach()
        y_cuda = torch.autograd.Variable(torch.from_numpy(y_d_p).cuda(),
                                         requires_grad=False).float().detach()

        # Forward analysis pass: Input data
        x_real, x_imag = nn_list[0].forward(x_cuda)
        # Magnitude computation
        mag = torch.sqrt(x_real.pow(2) + x_imag.pow(2))
        # Mel analysis
        mel_mag = torch.autograd.Variable(nn_list[1].forward(mag).data,
                                          requires_grad=True)

        # Learned normalization
        mel_mag_pr = nn_list[2].forward(mel_mag)
        # GRUs
        h_enc = nn_list[3].forward(mel_mag_pr)
        h_dec = nn_list[4].forward(h_enc)
        # Classifier
        _, vad_prob = nn_list[5].forward(h_dec, mel_mag_pr)
        vad_prob = sigmoid(vad_prob)
        vad_prob = vad_prob.gt(0.51).float().data.cpu().numpy()[:, :, 0]\
            .reshape(exp_settings['batch_size']*exp_settings['T'], 1)

        # Target data preparation
        y_true = nn_list[6].forward(y_cuda).detach()[:, :, 0]
        vad_true = y_true.gt(0.51).float().data.cpu().numpy().reshape(
            exp_settings['batch_size'] * exp_settings['T'], 1)

        if batch == 0:
            out_prob = vad_prob
            out_true_prob = vad_true
        else:
            out_prob = np.vstack((out_prob, vad_prob))
            out_true_prob = np.vstack((out_true_prob, vad_true))

    res = prf(out_true_prob, out_prob, average='binary')
    cls_error = np.sum(
        np.abs(out_true_prob - out_prob)) / len(out_true_prob) * 100.

    print('Precision: %.2f' % res[0])
    print('Recall: %.2f' % res[1])
    print('Fscore: %.2f' % res[2])
    print('Error: %.2f' % cls_error)

    return cls_error
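
All five examples come from the same module and rely on names defined at module level rather than inside the functions. The sketch below lists the imports the code appears to assume, where prf is taken to be scikit-learn's precision_recall_fscore_support; the project-specific pieces helpers, visualize, build_model and the exp_settings dictionary belong to the original repository and are not reconstructed here.

# Assumed module-level header, inferred from usage in the examples above.
import os

import numpy as np
import torch
from torch.optim.lr_scheduler import StepLR
from sklearn.metrics import precision_recall_fscore_support as prf
from tqdm import tqdm
import matplotlib.pyplot as plt
from mpl_toolkits.mplot3d import Axes3D

# Project-specific names used above but not reconstructed here:
# helpers, visualize, build_model, exp_settings.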