In this lab, you'll use point data, describing the movement of a talking person, to animate a cartoon face.
In order to make sure everything works, you might want to go to the command line and run

pip install -r requirements.txt

This will install the modules that are used by the autograder, including numpy, h5py, and the Gradescope utilities.
The data is made available to you in an HDF5 file, data.hdf5. For more information about the HDF5 data storage format, see HDF5 for Python.
import h5py
data = {}
with h5py.File('data.hdf5') as f:
    for group in f.keys():
        data[group] = {}
        for dataset in f[group].keys():
            data[group][dataset] = f[group][dataset][:]
            print('data[%s][%s] has shape %s'%
                  (group,dataset,data[group][dataset].shape))
data[mr][corner] has shape (4, 2)
data[mr][image] has shape (224, 224)
data[mr][moving] has shape (8, 2)
data[mr][static] has shape (11, 2)
data[mr][triangles] has shape (40, 3)
data[xr][fps] has shape (1,)
data[xr][fs] has shape (1,)
data[xr][moving] has shape (438, 8, 2)
data[xr][static] has shape (11, 2)
data[xr][wav] has shape (66150,)
As you can see, data.hdf5 includes data from two different recording sources:

- mr data is from a magnetic resonance image, posted on Wikipedia with a CC-SA 3.0 license by Pogrebnoj-Alexandroff.
- xr data is from an X-ray microbeam recording created by the University of Wisconsin X-ray Microbeam project. At the time of this writing, the data are available from UC Berkeley.

The file data.hdf5 contains three seconds extracted from one of the recordings, recording tp010 from participant JW14. We can listen to the waveform using IPython.display:
import IPython.display
IPython.display.Audio(data['xr']['wav'],rate=data['xr']['fs'][0])
The xr data includes two sets of points: static points and moving points. There are 11 static points: 9 on the palate, and 2 on the pharynx. Each point is a pair of (X,Y) coordinates. Notice that the speaker is facing to the right.
import matplotlib.pyplot as plt
fig, ax = plt.subplots(1,1,figsize=(5,5))
ax.plot(data['xr']['static'][:,0],data['xr']['static'][:,1],'b.')
ax.set_title('Palate and Pharynx of XRMB participant JW14')
The moving points are a set of 438 frames, each of which contains 8 points. This file has a constant frame rate of data['xr']['fps'] frames per second (not all XRMB files have a constant frame rate, but this one does):
print('XRMB frame rate, in frames per second, is',data['xr']['fps'][0])
print('Downsampling by 10 would give',10000/data['xr']['fps'][0],'ms per frame')
XRMB frame rate, in frames per second, is 145.64520827264784
Downsampling by 10 would give 68.66 ms per frame
The provided frame rate, 146 fps, is too fast for the human eye to follow, so displaying every frame is a waste of processor power. Instead, let's downsample by a factor of 10, to 14.6 fps (69 ms per frame).

We can create an animation object using matplotlib.animation.FuncAnimation, then show it inline using IPython.display.HTML. This will show four pellets on the tongue, two on the jaw, and two on the lips, moving up and down.
from matplotlib import animation

# First set up the figure, the axis, and the plot element we want to animate
fig = plt.figure(figsize=(5,5))
ax = plt.axes(xlim=(-80000, 30000), ylim=(-20000, 20000))
line, = ax.plot([], [], 'C1.', lw=1)

# Initialization function: plot the background of each frame
def init():
    ax.plot(data['xr']['static'][:,0],data['xr']['static'][:,1],'b.')
    line.set_data([],[])
    return line,

# Animation function which updates figure data, showing (x,y) points
def animate(i):
    line.set_data(data['xr']['moving'][10*i,:,0],data['xr']['moving'][10*i,:,1])
    return line,

# Call the animator. blit=True means only re-draw the parts that have changed.
nframes = int(data['xr']['moving'].shape[0]/10)
anim = animation.FuncAnimation(fig, animate, init_func=init,
                               frames=nframes, interval=69, blit=True)
plt.close(anim._fig)
import IPython
IPython.display.HTML(anim.to_html5_video())
The magnetic resonance data contains:

- data['mr']['image'] - a grayscale image
- data['mr']['static'] - 11 points along the palate and pharynx, listed in the same order as the points in data['xr']['static'].
- data['mr']['moving'] - 8 points on the lips, tongue, and jaw, listed in the same order as the points in data['xr']['moving']. Note that these are called moving because the XRMB points move; the MRI points do not move.
- data['mr']['corner'] - 4 points on the corners of the image
- data['mr']['triangles'] - a list of triangles, connecting the points, and tiling the entire image.

First, let's see all the points.
fig, ax = plt.subplots(1,1,figsize=(10,10))
ax.imshow(data['mr']['image'],cmap='gray')
ax.plot(data['mr']['corner'][:,0],data['mr']['corner'][:,1],'C2o')
ax.plot(data['mr']['moving'][:,0],data['mr']['moving'][:,1],'C1o')
ax.plot(data['mr']['static'][:,0],data['mr']['static'][:,1],'C0o')
Now let's plot the triangles. Each triangle is a triplet of integers; these integers are indices into the combined points array. The points array is a vstack of the three different types of points in the MR image, in alphabetical order, i.e., corner first, then moving, then static.
import numpy as np
points = np.vstack((data['mr']['corner'],data['mr']['moving'],data['mr']['static']))
fig, ax = plt.subplots(1,1,figsize=(10,10))
ax.imshow(data['mr']['image'],cmap='gray')
for i in range(data['mr']['triangles'].shape[0]):
    tri = data['mr']['triangles'][i,:]
    x = points[(tri[0],tri[1],tri[2],tri[0]),0]
    y = points[(tri[0],tri[1],tri[2],tri[0]),1]
    ax.plot(x,y,'C1')
The goal of this MP is to use the XRMB data to animate the MR image, using the triangles shown above. Notice that all points in the triangles exist in both MR and XRMB except the four corners -- it's not obvious what points in XRMB correspond to the four corners.
In order to define the correspondences for all 23 points (4 corners, 8 moving points, and 11 static points), let's scale, reflect, shift, and rotate the XRMB points in order to put them into the space of the MR image. In other words, we want to find an affine transformation that converts the head of the person recorded by X-ray microbeam so it resembles, as closely as possible, the head of the person recorded by MRI. We will define "as closely as possible" to be the affine transform that minimizes the mean-squared error between the two heads. Notice that this won't be perfect -- just rotating, scaling, and shearing one head is not sufficient to make it exactly match the other head. But at least it will take care of unimportant differences, like differences in rotation.
MMSE Affine Transformation is very similar to Procrustes Analysis, except that Procrustes analysis is more limited. Procrustes analysis requires that you scale both $x$ and $y$ directions by the same amount, and it doesn't permit any shear. MMSE Affine Transformation allows shear, and it allows different scalings in the $x$ and $y$ directions.
Suppose we have a set of source points $s_k=[s_{k,1},s_{k,2},1]$ for $1\le k\le N$, and we want to transform them to predictions $p_k=[p_{k,1},p_{k,2},1]$ in order to minimize $\sum_k\Vert p_k-t_k\Vert^2$, where $t_{k}=[t_{k,1},t_{k,2},1]$ is the target value of the point. The goal, then, is to find the six parameters $a_{1,1},\ldots,a_{3,2}$ in order to minimize:
$${\mathcal J}= \sum_k\Vert t_k^T-A^Ts_k^T\Vert^2= \sum_k\left\Vert \left[\begin{array}{c}t_{k,1}\\t_{k,2}\\1\end{array}\right]- \left[\begin{array}{ccc}a_{1,1}&a_{2,1}&a_{3,1}\\ a_{1,2}&a_{2,2}&a_{3,2}\\0&0&1\end{array}\right] \left[\begin{array}{c}s_{k,1}\\s_{k,2}\\1\end{array}\right]\right\Vert^2$$

The file submitted.py contains a function called find_affine, which currently throws a RuntimeError. You should delete the RuntimeError, then complete find_affine so that it does the task described by its docstring:
import importlib, submitted
importlib.reload(submitted)
help(submitted.find_affine)
Help on function find_affine in module submitted:

find_affine(sourcepoints, targetpoints)
    Find the MMSE affine transform from sourcepoints to targetpoints.
    Assume that sourcepoints and targetpoints are sorted,
    so that they are in one-to-one correspondence.

    @param:
    sourcepoints (Nx2): a set of source points
    targetpoints (Nx2): a set of target points

    @return:
    predictions (Nx2): the set of predicted target points,
        augmentedsource = np.hstack((sourcepoints, np.ones((N,1))))
        predictions = augmentedsource @ affine
    affine (3x2): linear transform matrix, chosen to minimize
        np.sum(np.square(targetpoints-predictions))
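Since ${\mathcal J}$ is an ordinary linear least-squares objective, one possible approach is to solve it with np.linalg.lstsq. The following is a minimal sketch, not necessarily the intended solution; the function name is illustrative:

import numpy as np

def find_affine_sketch(sourcepoints, targetpoints):
    # Append a column of ones so the shift is part of the linear transform,
    # then let lstsq minimize the sum of squared errors, column by column.
    N = sourcepoints.shape[0]
    augmented = np.hstack((sourcepoints, np.ones((N,1))))                   # (N,3)
    affine, _, _, _ = np.linalg.lstsq(augmented, targetpoints, rcond=None)  # (3,2)
    predictions = augmented @ affine                                        # (N,2)
    return predictions, affine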
You should compute the affine transform matrix, affine, based on sourcepoints composed of the XRMB static points, and target points composed of the MRI static points:
importlib.reload(submitted)
sourcepts = data['xr']['static']
targetpts = data['mr']['static']
predstatic,affine = submitted.find_affine(sourcepts, targetpts)
print('Affine transform matrix is')
print(affine)
Affine transform matrix is
[[-1.32212835e-03 -1.32467450e-04]
 [-2.00948347e-04 -2.58811101e-03]
 [ 7.26985460e+01  1.33733700e+02]]
fig, ax = plt.subplots(1,1,figsize=(5,5))
ax.imshow(data['mr']['image'],cmap='gray')
ax.plot(predstatic[:,0],predstatic[:,1],'c.')
Notice -- an MMSE affine transform is not sufficient to perfectly match one person's head to the head of a different person! The person who was imaged by XRMB has a much deeper palate than the person imaged using MRI; there's no way to make their two palates line up perfectly by just rotating, scaling, shifting, and skewing. The extra little bit of alignment will have to be done using piece-wise affine transformations in parts two and three of this MP.
Now that we have the points in the original MR image coordinates, we can create a video showing how the points are changing, as compared to the original positions on the MR image.
from matplotlib import animation
fig, ax = plt.subplots(1,1,figsize=(5,5))
ax.imshow(data['mr']['image'],cmap='gray')
ax.plot(predstatic[:,0],predstatic[:,1],'c.')
line, = ax.plot([], [], 'C1o')

# Initialization function: plot the background of each frame
def init():
    line.set_data([],[])
    return line,

# Animation function which updates figure data, showing (x,y) points
def animate(i):
    augmented = np.hstack((data['xr']['moving'][10*i,:,:],np.ones((8,1))))
    pts = augmented @ affine
    line.set_data(pts[:,0],pts[:,1])
    return line,

# Call the animator. blit=True means only re-draw the parts that have changed.
nframes = int(data['xr']['moving'].shape[0]/10)
anim = animation.FuncAnimation(fig, animate, init_func=init,
                               frames=nframes, interval=69, blit=True)
plt.close(anim._fig)
import IPython
IPython.display.HTML(anim.to_html5_video())
That view is a little deceptive. What we really want to do is find the triangles, in each synthesized view, and use those triangles to fill in the pixel values. Let's plot the triangles for each frame of the movie.
from matplotlib import animation
fig, ax = plt.subplots(1,1,figsize=(5,5))
ax.set_xlim(0,224)
ax.set_ylim(0,224)
ax.invert_yaxis()
frames = []
nframes = int(data['xr']['moving'].shape[0]/10)
for i in range(nframes):
    artists = []
    augmented = np.hstack((data['xr']['moving'][10*i,:,:],np.ones((8,1))))
    moving = augmented @ affine
    points = np.vstack((data['mr']['corner'],moving,predstatic))
    for j in range(data['mr']['triangles'].shape[0]):
        tri = data['mr']['triangles'][j,:]
        x = points[(tri[0],tri[1],tri[2],tri[0]),0]
        y = points[(tri[0],tri[1],tri[2],tri[0]),1]
        line, = ax.plot(x,y,'C1')
        artists.append(line)
    frames.append(artists)
# Call the animator. blit=True means only re-draw the parts that have changed.
anim = animation.ArtistAnimation(fig, frames, interval=69, blit=True)
plt.close(anim._fig)
import IPython
IPython.display.HTML(anim.to_html5_video())
The procedure for creating a movie will be as follows: for each pixel of each output frame, find the triangle containing that pixel, convert the pixel to barycentric coordinates relative to that triangle, convert back to cartesian coordinates relative to the corresponding triangle in the static image, and then look up the image intensity at that location. The next few functions implement these steps, starting with the coordinate conversions.
importlib.reload(submitted)
help(submitted.cartesian2barycentric)
Help on function cartesian2barycentric in module submitted:

cartesian2barycentric(cartesian, triangle)
    Convert an array full of pixels from cartesian coordinates
    to barycentric coordinates.

    @param:
    cartesian (npix,2): x,y coordinates of npix pixels
    triangle (3,2): x,y coordinates of each corner of the triangle

    @return:
    barycentric (npix,3): barycentric coordinates of the pixels.
        Each row should be a 3-vector such that
        barycentric @ triangle = cartesian
        and np.sum(barycentric[i,:])=1 for all i.

    If the corners of the triangle are all in a straight line, then solving
    this problem requires inverting a singular matrix.  If np.linalg.matrix_rank
    tells you that the matrix is singular, return the value "None" in place
    of barycentric.
We can debug with some known cases:

- The pixel $r_1=[1,1]$ is inside the triangle $T_1=[[0,0],[0,2],[2,0]]$, with barycentric coordinates $b_1=[0,\frac{1}{2},\frac{1}{2}]$.
- The pixel $r_2=[0.5,0.5]$ is also inside that triangle, so its barycentric coordinates should be non-negative numbers that sum to one.
- The pixel $r_3=[1.5,1.5]$ is not inside that triangle, so its barycentric coordinates should include some negative numbers.
- The triangle $T_2=[[0,0],[1,1],[2,2]]$ has zero area (its points are all in a line), so the required matrix inversion is singular. In this case, the method should return None in place of the desired barycentric coordinates.
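For reference, here is one way the conversion might be implemented. This is a minimal sketch only; the function name is illustrative, and it assumes the barycentric @ triangle = cartesian convention from the docstring:

import numpy as np

def cartesian2barycentric_sketch(cartesian, triangle):
    # Stack the corners with a column of ones, so that
    # barycentric @ M = [x, y, 1] encodes both constraints at once.
    M = np.hstack((triangle, np.ones((3,1))))             # (3,3)
    if np.linalg.matrix_rank(M) < 3:
        return None                                       # collinear corners: singular
    npix = cartesian.shape[0]
    augmented = np.hstack((cartesian, np.ones((npix,1)))) # (npix,3)
    return augmented @ np.linalg.inv(M)                   # (npix,3)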
importlib.reload(submitted)
tri = np.array([[0,0],[0,2],[2,0]])
print('The triangle is:\n',tri)
c = np.array([[1,1],[0.5,0.5],[1.5,1.5]])
b = submitted.cartesian2barycentric(c,tri)
for i in range(3):
    print('Cartesian %s has barycentric %s'%(str(c[i,:]),str(b[i,:])))
print('\n')
tri = np.array([[0,0],[1,1],[2,2]])
b = submitted.cartesian2barycentric(c,tri)
print('With this triangle:\n',tri)
print('Cartesian:\n %s\n has barycentric %s'%(str(c),str(b)))
The triangle is:
 [[0 0]
 [0 2]
 [2 0]]
Cartesian [1. 1.] has barycentric [0.  0.5 0.5]
Cartesian [0.5 0.5] has barycentric [0.5  0.25 0.25]
Cartesian [1.5 1.5] has barycentric [-0.5  0.75  0.75]

With this triangle:
 [[0 0]
 [1 1]
 [2 2]]
Cartesian:
 [[1.  1. ]
 [0.5 0.5]
 [1.5 1.5]]
 has barycentric None
Of course, we also need to be able to convert from barycentric coordinates back to cartesian coordinates:
importlib.reload(submitted)
help(submitted.barycentric2cartesian)
Help on function barycentric2cartesian in module submitted:

barycentric2cartesian(barycentric, triangle)
    Convert a pixel from barycentric coordinates to cartesian coordinates.

    @param:
    barycentric (npix, 3): barycentric coordinates.  Each row is a 3-vector,
        all barycentric coordinates are non-negative,
        and np.sum(barycentric[i,:])=1 for all i.
    triangle (3,2): x,y coordinates of each corner of the triangle

    @return:
    cartesian (npix, 2): cartesian coordinates
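This direction is just a matrix product. A one-line sketch (the function name is illustrative):

def barycentric2cartesian_sketch(barycentric, triangle):
    # Each cartesian point is a weighted combination of the three corners,
    # with the barycentric coordinates as the weights.
    return barycentric @ triangle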
importlib.reload(submitted)
tri = np.array([[0,0],[0,2],[2,0]])
print('The triangle is:\n',tri)
bary = np.array([[0,0.5,0.5], [0.5,0.25,0.25]])
c = submitted.barycentric2cartesian(bary,tri)
print('Barycentric:\n %s\nhas cartesian:\n%s'%(str(bary),str(c)))
The triangle is:
 [[0 0]
 [0 2]
 [2 0]]
Barycentric:
 [[0.   0.5  0.5 ]
 [0.5  0.25 0.25]]
has cartesian:
[[1.  1. ]
 [0.5 0.5]]
Next, let's use cartesian2barycentric and barycentric2cartesian to match pixels between the movie frame and the static MR image. The basic strategy is: for each pixel in the movie frame, find the triangle that contains it, compute the pixel's barycentric coordinates with respect to that triangle, then convert back to cartesian coordinates using the corresponding triangle in the static image.

In this function, we will assume that triangles is provided in the same format as data['mr']['triangles'], i.e., as integer indices into the array of points given by vstacking the corner, moving, and static points of each frame.
importlib.reload(submitted)
help(submitted.moving2static)
Help on function moving2static in module submitted:

moving2static(moving, moviepts, staticpts, triangles)
    Convert from a location in the movie frame to the corresponding location
    in the static image.

    It may sometimes happen that, due to rounding errors, one or more rows
    of moving can't be assigned to any triangle.  If that happens, set those
    rows to zero.

    @param:
    moving (npix,2): x,y pixel locations in the movie frame
    moviepts (23,2): array of x,y points in the movie frame
    staticpts (23,2): array of x,y points in the static image
    triangles (ntri,3): array of indices of triangle corners

    @return:
    static (npix,2): x,y location of pixel in static image
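A minimal sketch of that strategy, reusing the two conversion functions above (the function name is illustrative, and this is one possible approach, not necessarily the intended one):

import numpy as np
import submitted

def moving2static_sketch(moving, moviepts, staticpts, triangles):
    # For each pixel, search for a triangle (in movie-frame coordinates)
    # whose barycentric coordinates are all non-negative, then map those
    # coordinates through the matching static triangle.  Rows that land
    # in no triangle are left at zero, as the docstring requires.
    static = np.zeros_like(moving, dtype=float)
    for row in range(moving.shape[0]):
        for tri in triangles:
            bary = submitted.cartesian2barycentric(moving[row:row+1,:], moviepts[tri,:])
            if bary is not None and np.all(bary >= 0):
                static[row,:] = submitted.barycentric2cartesian(bary, staticpts[tri,:])[0,:]
                break
    return static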
We can test this by choosing the center of any two particular triangles. They should have (x,y) coordinates that move as the triangle moves, but the result of applying moving2static should always be the same static coordinates.
importlib.reload(submitted)
staticpts=np.vstack((data['mr']['corner'],data['mr']['moving'],data['mr']['static']))
nframes = data['xr']['moving'].shape[0]
moving = np.zeros((nframes,2,2))
static = np.zeros((nframes,2,2))
for i in range(nframes):
    augmented = np.hstack((data['xr']['moving'][i,:,:],np.ones((8,1))))
    predmoving = augmented @ affine
    moviepts = np.vstack((data['mr']['corner'],predmoving,predstatic))
    moving[i,0,:] = (moviepts[11,:]+moviepts[8,:]+moviepts[7,:])/3
    moving[i,1,:] = (moviepts[11,:]+moviepts[8,:]+moviepts[9,:])/3
    static[i,:,:] = submitted.moving2static(moving[i,:,:],moviepts,staticpts,data['mr']['triangles'])
import matplotlib.pyplot as plt
fig, ax = plt.subplots(2,1,figsize=(14,8))
ax[0].plot(np.arange(nframes),moving[:,0],np.arange(nframes),static[:,0])
ax[0].set_title('X coordinates, moving and static',fontsize=18)
ax[0].set_ylim((0,224))
ax[1].plot(np.arange(nframes),moving[:,1],np.arange(nframes),static[:,1])
ax[1].set_title('Y coordinates, moving and static',fontsize=18)
ax[1].set_ylim((0,224))
fig.tight_layout()
The MR image has pixel values defined for integer values of $(x,y)$. What is its value for a non-integer $(x,y)$?
Piece-wise constant interpolation gives results that are sometimes noticeably blocky. Sinc interpolation is expensive, and doesn't really work very well for images, because an image has a finite spatial extent. Bilinear interpolation tends to give the best results.
importlib.reload(submitted)
help(submitted.bilinear2d)
Help on function bilinear2d in module submitted:

bilinear2d(image, coordinates)
    Use bilinear interpolation to find the value of an image
    at non-integer coordinates.

    Notice that the image is in (y,x) order while the coordinates are in
    (x,y) order.  Notice also that there is no guarantee that the input
    coordinates are inside the original image; you need to deal with the
    case that coordinates might go outside the image.

    @param:
    image (ny,nx): grayscale image
    coordinates (npix,2): x,y of desired pixels

    @return:
    intensities (npix,): intensities of those pixels,
        computed by bilinear interpolation.
Again, let's test this with some known cases. For example, if the image is $[[0.01,1],[100,10000]]$, and the coordinate is $(0.6,0.7)$, then the returned value should be $0.0012+0.18+28+4200$.

If input pixels are beyond one edge of the input image, bilinear2d should respond by interpolating the nearest pixels. For example, the input coordinate $(-0.6,0.7)$ should find the value $0.003+70$.

If input pixels are beyond one corner of the input image, bilinear2d should respond by returning the nearest corner value. For example, the input coordinate $(3,3)$ should return the value $10000$.
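One way to satisfy all three cases is to clip out-of-range coordinates to the image border before blending. This is a sketch under that assumption; the function name is illustrative:

import numpy as np

def bilinear2d_sketch(image, coordinates):
    # Clip x,y into the valid range, then blend the four neighboring pixels.
    ny, nx = image.shape
    x = np.clip(coordinates[:,0], 0, nx-1)
    y = np.clip(coordinates[:,1], 0, ny-1)
    x0 = np.floor(x).astype(int)
    y0 = np.floor(y).astype(int)
    x1 = np.minimum(x0+1, nx-1)
    y1 = np.minimum(y0+1, ny-1)
    wx = x - x0
    wy = y - y0
    return ((1-wy)*(1-wx)*image[y0,x0] + (1-wy)*wx*image[y0,x1] +
            wy*(1-wx)*image[y1,x0] + wy*wx*image[y1,x1])

For the first test case above, this gives $0.3\cdot 0.4\cdot 0.01+0.3\cdot 0.6\cdot 1+0.7\cdot 0.4\cdot 100+0.7\cdot 0.6\cdot 10000 = 4228.1812$, matching the expected value.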
importlib.reload(submitted)
img = np.array([[0.01,1],[100,10000]])
r = np.array([[0.6,0.7],[-0.6,0.7],[3,3]])
v = submitted.bilinear2d(img, r)
for i in range(3):
    print('img[%s] = %8.8g'%(str(r[i,:]), v[i]))
img[[0.6 0.7]] = 4228.1812
img[[-0.6 0.7]] = 70.003
img[[3. 3.]] = 10000
The last part of this MP will generate the movie. Given a stack of points of dimension $(\text{nframes},23,2)$ and a static image of size $(\text{ny},\text{nx})$, you should create an output array of size $(\text{nframes},\text{ny},\text{nx})$, and then fill in its pixel values one frame at a time, movie[t,:,:].

importlib.reload(submitted)
help(submitted.animate)
Help on function animate in module submitted:

animate(image, moviepts, staticpts, triangles)
    Generate a movie by animating a static image.

    @param:
    image (ny,nx): grayscale image
    moviepts (nframes,23,2): points in each frame
    staticpts (23,2): points in the static image
    triangles (ntri,3): triplets of indices

    @return:
    movie (nframes,ny,nx): frames of the movie
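Putting the pieces together, a frame-by-frame sketch might look like this. The name is illustrative, and it assumes the moving2static and bilinear2d functions discussed above:

import numpy as np
import submitted

def animate_sketch(image, moviepts, staticpts, triangles):
    # For each frame, map every output pixel back into the static image,
    # then read its intensity there with bilinear interpolation.
    nframes = moviepts.shape[0]
    ny, nx = image.shape
    xgrid, ygrid = np.meshgrid(np.arange(nx), np.arange(ny))
    pixels = np.stack((xgrid.ravel(), ygrid.ravel()), axis=1)  # (ny*nx,2) in x,y order
    movie = np.zeros((nframes, ny, nx))
    for t in range(nframes):
        print('Synthesizing frame %d out of %d' % (t, nframes))
        static = submitted.moving2static(pixels, moviepts[t,:,:], staticpts, triangles)
        movie[t,:,:] = submitted.bilinear2d(image, static).reshape(ny, nx)
    return movie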
staticpts = np.vstack((data['mr']['corner'],data['mr']['moving'],data['mr']['static']))
nframes = int(data['xr']['moving'].shape[0]/10)
moviepts = np.zeros((nframes,23,2))
for t in range(nframes):
    augmented = np.hstack((data['xr']['moving'][10*t,:,:],np.ones((8,1))))
    moving = augmented @ affine
    moviepts[t,:,:] = np.vstack((data['mr']['corner'],moving,predstatic))
image = data['mr']['image']
triangles = data['mr']['triangles']
Doing the actual animation can take a lot of time. You might want to have your code print out frame numbers, as shown below.
importlib.reload(submitted)
movie = submitted.animate(image,moviepts,staticpts,triangles)
Synthesizing frame 0 out of 43
Synthesizing frame 1 out of 43
Synthesizing frame 2 out of 43
...
Synthesizing frame 42 out of 43
nframes, ny, nx = movie.shape
fig, ax = plt.subplots(1,1,figsize=(5,5))
ax.set_xlim(0,nx)
ax.set_ylim(0,ny)
ax.invert_yaxis()
frames = []
for t in range(nframes):
    artist = ax.imshow(movie[t,:,:], cmap='gray')
    frames.append([ artist ])
# Call the animator. blit=True means only re-draw the parts that have changed.
anim = animation.ArtistAnimation(fig, frames, interval=69, blit=True)
plt.close(anim._fig)
import IPython
IPython.display.HTML(anim.to_html5_video())
Congratulations!
If you have OpenCV or ffmpeg installed, you can save the video to a file, add the audio to it, and then load it back in to play in the Jupyter notebook. Alternatively, you can save the video as a GIF, then use tools of your choice to convert it to mp4 and add the audio.
If you reached this point in the notebook, then your code is probably working well, but before you run the autograder on the server, you should first run it on your own machine. You can do that with the following command line. If everything works perfectly, it should give a result like this:
!python grade.py
............
----------------------------------------------------------------------
Ran 12 tests in 4.973s

OK
But suppose that something didn't work well. For example, suppose you run python grade.py, and you get error messages.
You can debug by loading the reference solutions, and comparing your answer to the answer in the reference solutions.
The solutions the autograder was expecting are in the file solutions.hdf5. You are strongly encouraged to browse that file, in case you need to debug any problems with the autograder. First, make sure that you have the module h5py installed on your computer:
!pip install h5py
Requirement already satisfied: h5py in /Users/jhasegaw/anaconda3/lib/python3.10/site-packages (3.9.0)
Requirement already satisfied: numpy>=1.17.3 in /Users/jhasegaw/anaconda3/lib/python3.10/site-packages (from h5py) (1.24.3)
import h5py
with h5py.File('solutions.hdf5','r') as f:
    print(list(f.keys()))
['affine', 'bary', 'cartesian', 'coordinates', 'image', 'intensities', 'movie', 'moviepts', 'moving', 'predstatic', 'static', 'staticpts', 'triangle']
As you can see, this file contains a lot of objects. These are named more or less as in the Jupyter Notebook above, so you can look at each object in detail to figure out why your code is different from the solution.
By the way, grade.py is running Python's unittest facility, which is useful to understand if you ever intend to develop large-scale software projects. It runs all of the tests in the subdirectory tests, and raises an error only if one of the enclosed assert commands is found to be false.
When Gradescope grades your code, it will run grade.py. It will test your code using the solutions in solutions.hdf5, and using the test code tests/test_visible.py. It will also test your code using some hidden tests. The hidden tests are actually exactly the same as those in tests/test_visible.py, but with different input parameters.
You can earn up to 10% extra credit on this MP by finishing the file called extra.py, and submitting it to MP1 Extra on Gradescope.
This function uses bilinear interpolation to do a straightforward upsampling of the image, from $n_{y1}\times n_{x1}$ pixels to $n_{y2}\times n_{x2}$ pixels.
import extra, importlib
importlib.reload(extra)
help(extra.bilinear_upsample)
Help on function bilinear_upsample in module extra:

bilinear_upsample(X, newshape)
    Upsample an image using bilinear interpolation.
    You can check your result using PIL.Image.BILINEAR or scipy.misc.imresize,
    but those won't be available on the autograder (see requirements.txt).

    @param:
    X (ny1,nx1) - input image
    newshape (2,) - new shape, in y,x order (ny2,nx2)

    @return:
    Y (ny2,nx2) - output image

    Note that you should find ny2 rows linearly spaced in the range [0,ny1)
    in the input image, i.e., including the coordinate 0, but not including
    the coordinate ny1.  Likewise for nx.
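Since the grid spacing is spelled out in the docstring, one possible approach is to build the sample coordinates with np.linspace and reuse bilinear2d from the main MP. A sketch only; the name is illustrative, and it assumes extra.py can import submitted:

import numpy as np
import submitted

def bilinear_upsample_sketch(X, newshape):
    # Build ny2 x nx2 sample coordinates, linearly spaced in [0,ny1) and
    # [0,nx1), then interpolate the input image at those coordinates.
    ny1, nx1 = X.shape
    ny2, nx2 = newshape
    ys = np.linspace(0, ny1, ny2, endpoint=False)
    xs = np.linspace(0, nx1, nx2, endpoint=False)
    xgrid, ygrid = np.meshgrid(xs, ys)
    coords = np.stack((xgrid.ravel(), ygrid.ravel()), axis=1)  # x,y order
    return submitted.bilinear2d(X, coords).reshape(ny2, nx2)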
When you think you have it working, you can test it by running python grade.py in your terminal. Yes, indeed, this is the same code you ran for the regular MP! The only difference is that, when you unzipped mp1_extra.zip, it gave you the test file tests/test_extra.py. So now, when you run grade.py, it will grade both your regular MP and the extra credit part:
!python grade.py
............
----------------------------------------------------------------------
Ran 12 tests in 4.808s

OK
Congratulations! That's the end of MP1. Good luck!