ECE 417 MP5: Face Detection using Faster RCNN

In this MP, you will implement the Faster RCNN object detector and use it to perform face detection on a small dataset extracted from the much larger WIDER FACE dataset.

0. Browsing the Data

First, we'll create a function that plots face rectangles on top of the image. Then we'll use it to look at some of the data.

The dataset is provided to you as a set of 50 images, together with their extracted features and their labels.

These things are available so that you can look at the data. They are not actually going to be used by the neural net:

These are the things the neural net will actually use. They have been computed for you from the data above:

The two layers of the Faster RCNN are

  1. A $3\times 3$ convolutional layer, with $N_C=512$ input channels, thus
$$\xi^{(1)}[n_1,n_2,d] = \sum_{c=0}^{N_C-1}\sum_{m_1=-1}^{1}\sum_{m_2=-1}^{1}w^{(1)}[m_1,m_2,c,d]x[n_1-m_1,n_2-m_2,c]$$
$$h[n_1,n_2,d]=\mbox{ReLU}\left(\xi^{(1)}[n_1,n_2,d]\right),$$

and W1.shape is $(M_1,M_2,N_C,N_D)=(3,3,512,128)$.

  2. A $1\times 1$ convolution, with $N_D=128$ input channels, and $N_A\times N_Y$ outputs. The $N_A\times N_Y$ outputs match the last two dimensions of the target array: they correspond to $N_A$ anchor rectangles ($a$) per position, with $N_Y$ outputs per anchor rectangle, thus:
$$\xi^{(2)}[n_1,n_2,a,k]=\sum_d w^{(2)}[0,0,d,a,k]h[n_1,n_2,d]$$

and W2.shape is $(1,1,N_D,N_A,N_Y)=(1,1,128,9,5)$. Notice that this layer is described as a "$1\times 1$ convolution," and you could implement it that way, where the tensor $h[:,:,:]$ is convolved with the filter $w^{(2)}[:,:,:,:,k]$. Alternatively, you could just implement it as a matrix multiplication, where each vector $h[n_1,n_2,:]$ is multiplied by the matrix $w^{(2)}[0,0,:,:,k]$. Either implementation should work (the ECE 417 staff have tried both).
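For example, the matrix-multiplication view can be written in one line with np.einsum. Here is a small, self-contained sketch; the array names and random contents are just for illustration:

```python
import numpy as np

N1, N2, ND, NA, NY = 8, 8, 128, 9, 5
h = np.random.randn(N1, N2, ND)          # hidden-layer activations (illustrative)
w2 = np.random.randn(1, 1, ND, NA, NY)   # second-layer weights (illustrative)

# xi2[n1, n2, a, k] = sum_d w2[0, 0, d, a, k] * h[n1, n2, d]
xi2 = np.einsum('ijd,dak->ijak', h, w2[0, 0])
print(xi2.shape)   # (8, 8, 9, 5)
```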

The W1 and W2 tensors have been initialized to some small random values in the file weights_initial.hdf5:

Neural network weights are never initialized to all zeros, because if all of the columns of W1 are the same to begin with, then they will also receive the same gradients. If they receive the same gradients, then they remain identical to one another after training, and so we wind up with a W1 matrix whose columns are all the same -- a result that's guaranteed to have suboptimal performance. Instead, neural network weights are initialized to small random values.

Next, let's plot an image, and overlay its reference rectangles on top:

The anchors are the set of anchor rectangles. They are the same for every image. There are $N_A=9$ anchor rectangles, for each of $N_1\times N_2$ pixel locations. Each rectangle has 4 numbers: x, y, width, and height. Thus, anchors is an array of size $(N_1,N_2,N_A,4)$.

There are $N_A$ anchors associated with each of $N_1\times N_2$ positions. The smallest anchor associated with each position is the $0^{\textrm{th}}$ rectangle; let's plot that one first, for all $N_1\times N_2$ positions.

The 9 anchors associated with any given position are 9 different rectangles with 3 different sizes (small, medium, large) $\times$ 3 different aspect ratios (horizontal, square, vertical). Let's plot all 9 of them, for the position in the middle of the image.

Finally: the classification targets and regression targets are encoded into the array called targets. Specifically, the binary classification target for the $a^{\textrm{th}}$ anchor at the $(x,y)^{\textrm{th}}$ position in the $i^{\textrm{th}}$ image is encoded as targets[i,x,y,a,4], and if the classification target is 1, then the regression target is encoded as targets[i,x,y,a,0:4].

The way in which they're encoded is given in the paper https://proceedings.neurips.cc/paper/2015/file/14bfa6bb14875e45bba028a21ed38046-Paper.pdf, and also in the function submitted.regression_rects, which is provided to you as a utility function. The following code inverts that encoding, to get the original rectangles back again as [x,y,w,h] vectors.
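Here is a minimal sketch of such a decoder, assuming the standard Faster RCNN parameterization from the paper above; the provided submitted.regression_rects may differ in its details:

```python
import numpy as np

def target2rect(regression_target, anchor):
    '''
    Decode a length-4 regression target back into an [x, y, w, h] rectangle,
    relative to its length-4 anchor rectangle.  This is a sketch, assuming the
    parameterization of the Faster RCNN paper; the provided utilities may differ.
    '''
    xa, ya, wa, ha = anchor
    tx, ty, tw, th = regression_target
    x = xa + wa * tx
    y = ya + ha * ty
    # min(np.log(2), regression_target) keeps the decoded rectangle from ever
    # being more than twice as large as the anchor rectangle
    w = wa * np.exp(min(np.log(2), tw))
    h = ha * np.exp(min(np.log(2), th))
    return np.array([x, y, w, h])
```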

Notice the min(np.log(2),regression_target) here. That keeps the computed rectangle from ever being more than twice as large as the anchor rectangle. I recommend that you use such a limit in your code, because sometimes the neural net outputs get very large.

The Faster-RCNN coding scheme creates a target whenever a reference rectangle and an anchor rectangle have an IoU (intersection-over-union) greater than 0.7. For that reason, there are a lot more target rectangles than there were reference rectangles. When we decode them using target2rect, though, it turns out that they are multiple copies of the same rectangle:
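For reference, the IoU of two rectangles stored as [x, y, w, h] can be computed as in the sketch below, which assumes that (x, y) is the upper-left corner (the course utilities might use a different convention, such as the rectangle center):

```python
def iou(rect1, rect2):
    '''Intersection-over-union of two [x, y, w, h] rectangles (corner convention assumed).'''
    x1, y1, w1, h1 = rect1
    x2, y2, w2, h2 = rect2
    # length of the overlap along each axis (zero if the rectangles don't overlap)
    ix = max(0.0, min(x1 + w1, x2 + w2) - max(x1, x2))
    iy = max(0.0, min(y1 + h1, y2 + h2) - max(y1, y2))
    intersection = ix * iy
    union = w1 * h1 + w2 * h2 - intersection
    return intersection / union if union > 0 else 0.0
```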

If we plot the target rectangles, though, we should see that the number of distinct target rectangles is just the same as the number of reference rectangles. All of the extra targets are just duplicates of the same original references:

Now that we've seen all of those things for one of the images, go up to the top of this section and choose image #1, or #2, or #49 (any number less than 50), in order to look at a different image.

1. Provided Utility Functions: conv2, conv_layer, sigmoid, and safe_log

In an attempt to make your life a little easier, you are provided with some utility functions.

The first one, conv2, just performs a 2d convolution. It is unusual in just one respect: if its inputs have the sizes (N1,N2) and (M1,M2), its output always has the size (N1-M1+1+2$\times$padding,N2-M2+1+2$\times$padding). This is the same as zero-padding the first input by padding rows and columns on every side prior to convolution, and then convolving in 'valid' mode.
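If you want to see roughly what conv2 does, here's a minimal sketch built on scipy (this is only for intuition; use the provided conv2, which may be implemented differently):

```python
import numpy as np
from scipy.signal import convolve2d

def conv2_sketch(X, W, padding=0):
    '''
    Zero-pad X by `padding` rows/columns on every side, then convolve with W
    in 'valid' mode.  If X is (N1, N2) and W is (M1, M2), the output has size
    (N1 - M1 + 1 + 2*padding, N2 - M2 + 1 + 2*padding).
    '''
    Xp = np.pad(X, padding, mode='constant')
    return convolve2d(Xp, W, mode='valid')
```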

Let's test it by convolving a zero-padded square and an unpadded square; the output should be a square pyramid.

Suppose the two inputs have the same size, and we want the output to be $3\times 3$. We can get this effect by setting padding=1. For example, if we convolve the zero-padded square with itself, we get a $3\times 3$ small pyramid.

The second utility function that you're provided is a full conv_layer, which goes from $N_C$ input channels to $N_D$ output channels. Let's create an input image with squares of three colors in the three corners, and then convolve with the triangle function in order to blur each color, without mixing the colors.
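A multi-channel conv_layer built on top of conv2 might look roughly like the sketch below (again, only for intuition; the provided conv_layer is what your code should actually use):

```python
import numpy as np

def conv_layer_sketch(X, W, padding=1):
    '''
    X: input tensor of shape (N1, N2, NC)
    W: weight tensor of shape (M1, M2, NC, ND)
    Returns a tensor of shape (N1-M1+1+2*padding, N2-M2+1+2*padding, ND),
    using the conv2_sketch defined above.
    '''
    N1, N2, NC = X.shape
    M1, M2, _, ND = W.shape
    out = np.zeros((N1 - M1 + 1 + 2 * padding, N2 - M2 + 1 + 2 * padding, ND))
    for d in range(ND):
        for c in range(NC):
            out[:, :, d] += conv2_sketch(X[:, :, c], W[:, :, c, d], padding)
    return out
```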

You are also provided with a sigmoid function. This is provided for you mostly because computing 1/(1+np.exp(-x)) directly can overflow and produce warnings or non-finite values when x is very negative. In order to simplify this, the provided function just sets sigmoid(x)==0 for x<-100.

You are also provided with a safe_log function. This is provided for you mostly because np.log(x) blows up (toward -inf, with warnings) as x approaches zero. In order to simplify this, the provided function just sets safe_log(x)==0 for x<np.exp(-100).
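Sketches consistent with the behavior described above (the provided versions may differ in their exact thresholds or implementation):

```python
import numpy as np

def sigmoid(x):
    '''Elementwise logistic sigmoid, with the output forced to 0 wherever x < -100.'''
    x = np.asarray(x, dtype=float)
    out = np.zeros_like(x)
    mask = x >= -100
    out[mask] = 1.0 / (1.0 + np.exp(-x[mask]))
    return out

def safe_log(x):
    '''Elementwise natural log, with the output forced to 0 wherever x < np.exp(-100).'''
    x = np.asarray(x, dtype=float)
    out = np.zeros_like(x)
    mask = x >= np.exp(-100)
    out[mask] = np.log(x[mask])
    return out
```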

2. forwardprop

forwardprop should compute forward-propagation through the Faster-RCNN network.

The input is one feature tensor per input image. The feature tensor is the last conv layer, just before the fifth max pooling layer, from a pre-trained image classifier called VGG16 (https://neurohive.io/en/popular-networks/vgg16/). VGG16 assumes that the input image is $224\times 224\times 3$. There are 4 downsampling layers before that point, so the feature tensor is $\frac{224}{2^4}\times\frac{224}{2^4}=14\times 14$ pixels, from which we've chosen the center $N_1=8$ rows and $N_2=8$ columns. It has $N_C=512$ channels per pixel. So let's say that the input is $x[i,n_1,n_2,c]$ in the $i^{\textrm{th}}$ image, $n_1^{\textrm{th}}$ row, $n_2^{\textrm{th}}$ column, and $c^{\textrm{th}}$ channel.

The classification part of the output is the last element ($k=4$); it uses a logistic sigmoid output nonlinearity:

$$\hat{y}[n_1,n_2,a,4] = \sigma\left(\xi^{(2)}[n_1,n_2,a,4]\right)$$

The regression part is all of the rest; it just uses a linear output layer:

$$\hat{y}[n_1,n_2,a,0:4] = \xi^{(2)}[n_1,n_2,a,0:4]$$
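Putting the pieces together, a forwardprop for a single image might look roughly like this, reusing the conv_layer and sigmoid sketches from Section 1 above (the names and signatures here are illustrative, not the ones your submitted.py is required to use):

```python
def forwardprop_sketch(x, W1, W2):
    '''
    x:  (N1, N2, NC) feature tensor for one image
    W1: (3, 3, NC, ND) first-layer weights
    W2: (1, 1, ND, NA, NY) second-layer weights
    Returns the hidden activations h and the network outputs yhat.
    '''
    xi1 = conv_layer_sketch(x, W1, padding=1)        # (N1, N2, ND)
    h = np.maximum(0.0, xi1)                         # ReLU
    # the 1x1 convolution, implemented as a per-position matrix multiply
    xi2 = np.einsum('ijd,dak->ijak', h, W2[0, 0])    # (N1, N2, NA, NY)
    yhat = np.copy(xi2)
    yhat[:, :, :, 4] = sigmoid(xi2[:, :, :, 4])      # classification output
    # the regression outputs yhat[:, :, :, 0:4] stay linear
    return h, yhat
```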

3. detect

The detect function takes the output of forwardprop, and uses it to detect candidate face rectangles in the image.

Your function detect should find the (n1,n2,a) tuples that the neural net thinks are most probable (highest classification probability). For each one, it should convert the regression output back into an image rectangle, and append it to the best_rects output. Then we can plot those best_rects on the original image.
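A rough sketch of that logic, reusing the target2rect sketch from Section 0 (treat the function name and arguments here as placeholders; your detect must follow the signature given in the MP code):

```python
def detect_sketch(yhat, anchors, num_rects=10):
    '''
    yhat:    (N1, N2, NA, NY) network outputs for one image
    anchors: (N1, N2, NA, 4) anchor rectangles
    Returns the [x, y, w, h] rectangles for the num_rects most probable
    (n1, n2, a) tuples.
    '''
    probs = yhat[:, :, :, 4]
    # flattened indices of the highest classification probabilities
    best_indices = np.argsort(probs, axis=None)[::-1][:num_rects]
    best_rects = []
    for flat_index in best_indices:
        n1, n2, a = np.unravel_index(flat_index, probs.shape)
        best_rects.append(target2rect(yhat[n1, n2, a, 0:4], anchors[n1, n2, a]))
    return best_rects
```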

You should not expect it to give very accurate results, yet, since the network weights have been initialized randomly, and not trained yet!

4. loss

Now we need to compute the loss. For Faster RCNN, the loss has two parts: $${\mathcal L} = {\mathcal L}_{MSE} + {\mathcal L}_{BCE}$$

The MSE loss is the average squared difference between the regression target and the regression output, averaged over only those rectangles where the ground truth says that the rectangle contains a face ($y[n_1,n_2,a,4]=1$):

$${\mathcal L}_{MSE} = \frac{1}{2} \frac{\sum_{n_1=0}^{N_1-1}\sum_{n_2=0}^{N_2-1}\sum_{a=0}^{N_A-1} y[n_1,n_2,a,4]\times\Vert y[n_1,n_2,a,0:4]-\hat{y}[n_1,n_2,a,0:4]\Vert^2} {\sum_{n_1=0}^{N_1-1}\sum_{n_2=0}^{N_2-1}\sum_{a=0}^{N_A-1}y[n_1,n_2,a,4]} $$

The other term in the loss, ${\mathcal L}_{BCE}$, is the usual binary cross entropy loss for the classification output of the network ($\hat{y}[n_1,n_2,a,4]$), summed over position ($n_1,n_2$) and anchor ($a$):

$${\mathcal L}_{BCE}=-\frac{1}{N_1N_2N_A}\sum_{n_1=0}^{N_1-1}\sum_{n_2=0}^{N_2-1}\sum_{a=0}^{N_A-1}\left(y[n_1,n_2,a,4]\ln\hat{y}[n_1,n_2,a,4]+(1-y[n_1,n_2,a,4])\ln(1-\hat{y}[n_1,n_2,a,4])\right)$$
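A numpy sketch of these two terms for one image, using the safe_log sketch above to guard against log(0); it assumes that at least one anchor in the image contains a face, so the MSE denominator is nonzero:

```python
def loss_sketch(y, yhat):
    '''
    y, yhat: (N1, N2, NA, NY) target and output tensors for one image.
    Returns (mse_loss, bce_loss).
    '''
    face = y[:, :, :, 4]                              # 1 where the anchor contains a face
    diff = y[:, :, :, 0:4] - yhat[:, :, :, 0:4]
    # MSE averaged over only the anchors that contain a face
    mse = 0.5 * np.sum(face[:, :, :, None] * diff ** 2) / np.sum(face)
    # BCE averaged over all positions and anchors
    bce = -np.mean(face * safe_log(yhat[:, :, :, 4])
                   + (1 - face) * safe_log(1 - yhat[:, :, :, 4]))
    return mse, bce
```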

Well, that's a little dissatisfying -- are those numbers large, or small? The answer is, there's no way to know, really, until we try training the network for a while, to see if we can make those numbers smaller.

5. backprop

The loss function (loss) is really important for debugging (as we'll see later), but it's actually not necessary to train the network. To train the network, what we really need is the derivative of the loss, which we can compute without ever computing the loss itself. The derivative of the loss is

$$\nabla_\xi{\mathcal L}[n_1,n_2,a,k]=\frac{d{\mathcal L}}{d\xi[n_1,n_2,a,k]}$$

where $\xi[n_1,n_2,a,k]$ is the excitation (before the sigmoid nonlinearity) for the $a^{\textrm{th}}$ anchor at the $(n_1,n_2)^{\textrm{th}}$ position, for the $k^{\textrm{th}}$ network output.

BUG ALERT!

At the time of this writing (12/1/2021), I just learned that there is a bug in the solutions: the backprop function doesn't include the normalizing constants (the denominators) from the loss. If you are still working on this MP, please write the function backprop so that it calculates the derivative of the following loss, instead of the loss from your loss function:

$${\mathcal L}_{MSE} = \frac{1}{2}\sum_{n_1=0}^{N_1-1}\sum_{n_2=0}^{N_2-1}\sum_{a=0}^{N_A-1} y[n_1,n_2,a,4]\times\Vert y[n_1,n_2,a,0:4]-\hat{y}[n_1,n_2,a,0:4]\Vert^2 $$
$${\mathcal L}_{BCE}=-\sum_{n_1=0}^{N_1-1}\sum_{n_2=0}^{N_2-1}\sum_{a=0}^{N_A-1}\left(y[n_1,n_2,a,4]\ln\hat{y}[n_1,n_2,a,4]+(1-y[n_1,n_2,a,4])\ln(1-\hat{y}[n_1,n_2,a,4])\right)$$
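For this un-normalized loss, the output-layer gradient has a simple closed form: the sigmoid-plus-BCE combination gives $\hat{y}-y$ for the classification output, and the linear-plus-masked-MSE combination gives $y[n_1,n_2,a,4]\left(\hat{y}-y\right)$ for the regression outputs. A sketch:

```python
def backprop_sketch(y, yhat):
    '''
    Gradient of the un-normalized loss above with respect to the second-layer
    excitations xi2.  y and yhat have shape (N1, N2, NA, NY).
    '''
    grad_xi2 = np.zeros_like(yhat)
    face = y[:, :, :, 4]
    # sigmoid + BCE:  dL/dxi2[..., 4] = yhat - y
    grad_xi2[:, :, :, 4] = yhat[:, :, :, 4] - y[:, :, :, 4]
    # linear + masked MSE:  dL/dxi2[..., 0:4] = y[..., 4] * (yhat - y)
    grad_xi2[:, :, :, 0:4] = face[:, :, :, None] * (yhat[:, :, :, 0:4] - y[:, :, :, 0:4])
    return grad_xi2
```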

6. weight_gradient

The weight gradient is computed by multiplying the loss gradient with respect to a layer's excitation by the inputs of that same layer. Thus, for example,

$$\nabla_{W^{(1)}}{\mathcal L}[m_1,m_2,c,d]=\sum_{n_1}\sum_{n_2}\nabla_{\xi^{(1)}}{\mathcal L}[n_1-m_1,n_2-m_2,d]x[n_1,n_2,c],~~-1\le m_1\le 1,-1\le m_2\le 1$$
$$\nabla_{W^{(2)}}{\mathcal L}[0,0,d,a,k]=\sum_{n_1}\sum_{n_2}\nabla_{\xi^{(2)}}{\mathcal L}[n_1,n_2,a,k]h[n_1,n_2,d]$$
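A slow but readable translation of these two formulas into numpy is sketched below. It assumes you already have the loss gradients with respect to both excitations (the second comes from backprop; the first comes from back-propagating that result through W2 and the ReLU), that kernel offsets $m_1,m_2\in\{-1,0,1\}$ map to array indices 0..2, and that out-of-range terms are treated as zero:

```python
def weight_gradient_sketch(x, h, grad_xi1, grad_xi2):
    '''
    x:        (N1, N2, NC) input features
    h:        (N1, N2, ND) hidden activations
    grad_xi1: (N1, N2, ND) loss gradient w.r.t. the first-layer excitations
    grad_xi2: (N1, N2, NA, NY) loss gradient w.r.t. the second-layer excitations
    '''
    N1, N2, NC = x.shape
    ND = h.shape[2]
    NA, NY = grad_xi2.shape[2:]
    grad_W1 = np.zeros((3, 3, NC, ND))
    for m1 in range(-1, 2):
        for m2 in range(-1, 2):
            for n1 in range(N1):
                for n2 in range(N2):
                    if 0 <= n1 - m1 < N1 and 0 <= n2 - m2 < N2:
                        # grad_W1[m1, m2, c, d] += grad_xi1[n1-m1, n2-m2, d] * x[n1, n2, c]
                        grad_W1[m1 + 1, m2 + 1] += np.outer(x[n1, n2], grad_xi1[n1 - m1, n2 - m2])
    # grad_W2[0, 0, d, a, k] = sum_{n1, n2} grad_xi2[n1, n2, a, k] * h[n1, n2, d]
    grad_W2 = np.einsum('ijak,ijd->dak', grad_xi2, h).reshape(1, 1, ND, NA, NY)
    return grad_W1, grad_W2
```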

Here's the same thing for your submitted.py code:

7. weight_update

The weight update is just computed by subtracting the gradient, multiplied by a learning rate $\eta$:

$$W^{(1)}[m_1,m_2,c,d] = W^{(1)}[m_1,m_2,c,d]-\eta\nabla_{W^{(1)}}{\mathcal L}[m_1,m_2,c,d]$$
$$W^{(2)}[0,0,d,a,k]=W^{(2)}[0,0,d,a,k]-\eta\nabla_{W^{(2)}}{\mathcal L}[0,0,d,a,k]$$
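In other words, this is one step of plain gradient descent. In numpy it's just (a sketch, with an illustrative default learning rate):

```python
def weight_update_sketch(W1, W2, grad_W1, grad_W2, learning_rate=1e-3):
    '''One gradient-descent step on both weight tensors.'''
    new_W1 = W1 - learning_rate * grad_W1
    new_W2 = W2 - learning_rate * grad_W2
    return new_W1, new_W2
```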

8. Debugging: Check to make sure that the loss is decreasing

Back-propagation is really difficult to debug. If you made a mistake in any of those previous steps (and if you didn't have this MP's reference solutions to compare to), how would you know?

One useful method is to try several steps forward and backward along the gradient, and measure the loss at each step. If the gradient was computed correctly, you should see that loss increases in the direction of the gradient, and decreases in the direction of the negative gradient.

We can do this by trying several different values of the "learning rate" (which is a sort of normalized step size), and then plotting the loss as a function of the step size.
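A sketch of that check, using the hypothetical sketches from the earlier sections and assuming x, y, W1, W2, grad_W1, and grad_W2 are already in memory from the cells above. Since the update subtracts the gradient, the loss should decrease for small positive learning rates and increase for negative ones:

```python
import matplotlib.pyplot as plt

learning_rates = [-0.1, -0.03, -0.01, 0.0, 0.01, 0.03, 0.1]
losses = []
for eta in learning_rates:
    # take one step of size eta along the negative gradient, then re-measure the loss
    W1_step, W2_step = weight_update_sketch(W1, W2, grad_W1, grad_W2, learning_rate=eta)
    _, yhat_step = forwardprop_sketch(x, W1_step, W2_step)
    mse, bce = loss_sketch(y, yhat_step)
    losses.append(mse + bce)

plt.plot(learning_rates, losses, 'o-')
plt.xlabel('signed step size along the negative gradient (learning rate)')
plt.ylabel('loss')
plt.show()
```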

9. Conclusion

Congratulations --- you've learned how to train a Faster-RCNN object detector!

BTW, you probably noticed that this whole Jupyter notebook has only carried out training on one image. The so-called training set has only 50 images, which is still not enough to train such a large neural net. If you really wanted to train a successful face-detection neural net, you'd probably want to use the whole WIDER FACE dataset, and you'd want to run many epochs of training, probably on a GPU, using an adaptive or second-order optimizer like Adam or L-BFGS, probably using a package like PyTorch.

The main steps, however, would still be the same as those we've done here:

  1. forwardprop
  2. backprop
  3. weight_gradient
  4. weight_update
  5. measure the loss, to make sure it's still decreasing. If it isn't, stop training.