import numpy as np

from debugInitializeWeights import debugInitializeWeights
from computeNumericalGradient import computeNumericalGradient
from nnCostFunction import nnCostFunction, nnGradFunction
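
# For reference: computeNumericalGradient is assumed to approximate each
# partial derivative with a central difference,
#   dJ/dtheta_i ~= (J(theta + eps*e_i) - J(theta - eps*e_i)) / (2*eps),
# with EPSILON = 1e-4 (see the check at the end of this file). The helper
# below is a minimal illustrative sketch under that assumption; the real
# implementation is imported from computeNumericalGradient.py, and this
# hypothetical version is not used anywhere in this file.
def _numericalGradientSketch(J, theta, eps=1e-4):
    numgrad = np.zeros_like(theta, dtype=float)
    perturb = np.zeros_like(theta, dtype=float)
    for i in range(theta.size):
        # Perturb one coordinate at a time, central difference around theta
        perturb[i] = eps
        numgrad[i] = (J(theta + perturb) - J(theta - perturb)) / (2 * eps)
        perturb[i] = 0
    return numgrad
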
def checkNNGradients(lmbda=0):
    """Create a small neural network to check the backpropagation gradients.

    checkNNGradients(lmbda) builds a small network and prints the
    analytical gradients produced by your backprop code alongside the
    numerical gradients computed by computeNumericalGradient. The two
    gradient computations should produce very similar values.
    """
    input_layer_size = 3
    hidden_layer_size = 5
    num_labels = 3
    m = 5

    # Generate some 'random' test data; debugInitializeWeights is
    # deterministic, so the check is reproducible.
    Theta1 = debugInitializeWeights(hidden_layer_size, input_layer_size)
    Theta2 = debugInitializeWeights(num_labels, hidden_layer_size)
    # Reuse debugInitializeWeights to generate X
    X = debugInitializeWeights(m, input_layer_size - 1)
    # Labels cycle through 1..num_labels, as a column vector
    y = 1 + np.mod(np.arange(1, m + 1), num_labels)[:, None]

    # Unroll parameters
    nn_params = np.hstack((Theta1.ravel(), Theta2.ravel()))
    # Shorthand for the cost and gradient functions
    def costFunc(p):
        return nnCostFunction(p, input_layer_size, hidden_layer_size,
                              num_labels, X, y, lmbda)

    def gradFunc(p):
        return nnGradFunction(p, input_layer_size, hidden_layer_size,
                              num_labels, X, y, lmbda)

    grad = gradFunc(nn_params)
    numgrad = computeNumericalGradient(costFunc, nn_params)
    # Visually examine the two gradient computations; the two columns
    # should be very similar.
    print(np.c_[numgrad, grad])
    print('The above two columns should be very similar.\n'
          '(Left: your numerical gradient, Right: analytical gradient)\n')
    # Evaluate the norm of the difference between the two solutions.
    # With a correct implementation, and assuming EPSILON = 0.0001 in
    # computeNumericalGradient, diff should be less than 1e-9:
    #   diff = ||numgrad - grad|| / ||numgrad + grad||
    numerator = np.linalg.norm(numgrad - grad)
    denominator = np.linalg.norm(numgrad + grad)
    diff = numerator / denominator
    print('If your backpropagation implementation is correct, then\n'
          'the relative difference will be small (less than 1e-9).\n'
          '\nRelative Difference: %g\n' % diff)
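

# Example usage -- a minimal sketch assuming this module is run directly.
# lmbda = 3 is an arbitrary illustrative value for the regularized case.
if __name__ == '__main__':
    checkNNGradients()          # without regularization (lmbda = 0)
    checkNNGradients(lmbda=3)   # with regularization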