In this file, we're going to use the inverse DFT to create images from MRI spectral measurements. Then we'll use the DFT to filter out noise in an image.
import os, h5py
import numpy as np
import matplotlib.figure
import matplotlib.pyplot as plt
%matplotlib inline
import importlib
import submitted
The data are provided for you in the file data.hdf5. Let's load it, and see what it contains.
with h5py.File('data.hdf5','r') as f:
print('data.hdf5 has the keys',f.keys())
mri_dft = f['mri_dft'][:]
image = f['image'][:]
noisy_image = f['noisy_image'][:]
print('mri_dft is an array of shape',mri_dft.shape,'and dtype',mri_dft.dtype)
print('image is an array of shape',image.shape,'and dtype',image.dtype)
print('noisy_image is an array of shape',noisy_image.shape,'and dtype',noisy_image.dtype)
data.hdf5 has the keys <KeysViewHDF5 ['image', 'mri_dft', 'noisy_image']> mri_dft is an array of shape (1114, 962) and dtype complex128 image is an array of shape (213, 320, 3) and dtype float64 noisy_image is an array of shape (213, 320, 3) and dtype float64
MRI (magnetic resonance imaging) scans are acquired in the frequency domain: the scanner measures samples of the image's 2-D spatial frequency spectrum, and the image itself is recovered by taking an inverse DFT.
The image you are provided, mri_dft, is a set of complex-valued frequency samples from a real MRI image (a public domain image from Wikipedia, donated by Johns Hopkins University). Let's try taking the inverse DFT, to see if we can see the image.
fig,ax = plt.subplots(figsize=(10,8))
ax.imshow(np.maximum(0,np.real(np.fft.ifft2(mri_dft))), cmap='gray')
<matplotlib.image.AxesImage at 0x7fa75d9b7400>
The aliasing we see here is caused by capturing only $N_1\times N_2$ valid frequency samples, but computing the inverse DFT over a spatial range $M_1\times M_2$ such that $M_1>N_1$ and/or $M_2>N_2$. By doing that, we accidentally discover that the DFT is periodic in space, not just in frequency:
$$x[n+N] = \frac{1}{N}\sum_k X[k]e^{j\frac{2\pi k(n+N)}{N}} = \frac{1}{N}\sum_k X[k]e^{j\frac{2\pi kn}{N}} = x[n]$$
In order to solve this problem, we need to figure out how many of the frequency samples in mri_dft are actually nonzero-valued. To get an idea, let's plot the first 200 samples of one of the rows:
fig, ax = plt.subplots(figsize=(14,4))
ax.stem(np.abs(mri_dft[4,0:200]))
<StemContainer object of 3 artists>
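As an aside (not part of the assignment), here is a toy 1-D sketch of why an oversampled DFT with zeros interleaved between the valid samples produces repeated, scaled copies of the signal in space; the variable names here are hypothetical.
toy_x = np.array([1.0, 2.0, 3.0, 4.0])
toy_X = np.fft.fft(toy_x)                      # 4 valid frequency samples
toy_X_interleaved = np.zeros(8, dtype=complex)
toy_X_interleaved[::2] = toy_X                 # zeros in the odd-numbered bins
print(np.round(np.real(np.fft.ifft(toy_X_interleaved)), 6))
# -> [0.5 1.  1.5 2.  0.5 1.  1.5 2. ], i.e. two half-amplitude copies of toy_x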
It looks like maybe the odd-numbered spectral samples are zero, and only the even-numbered spectral samples are valid. Let's try taking the inverse FFT of only the even-numbered samples.
fig,ax = plt.subplots(figsize=(10,8))
downsampling_factor = 2
ax.imshow(np.real(np.fft.ifft2(mri_dft[::downsampling_factor,::downsampling_factor])), cmap='gray')
<matplotlib.image.AxesImage at 0x7fa7437752e0>
That's the right size, but now the whole image has been circularly shifted by about half of its height, and about half of its width! One way to solve this is by multiplying the DFT by a shift operator before we take the inverse DFT:
$$X_{\mbox{corrected}}[k_1,k_2] = \begin{cases} X[k_1,k_2] e^{-j\frac{2\pi k_1d_1}{N_1}}e^{-j\frac{2\pi k_2d_2}{N_2}} & 0\le k_1<\frac{N_1}{2},~0\le k_2<\frac{N_2}{2}\\ X[k_1,k_2] e^{-j\frac{2\pi (k_1-N_1)d_1}{N_1}}e^{-j\frac{2\pi (k_2-N_2)d_2}{N_2}} &\frac{N_1}{2}\le k_1<N_1,~\frac{N_2}{2}\le k_2<N_2 \end{cases}$$
where $d_1$ is the number of rows by which we want to shift, and $d_2$ is the number of columns by which we want to shift. Notice that, when $d_1$ and $d_2$ are integers, the second line is equal to the first line (because $e^{-j2\pi d_1}=e^{-j2\pi d_2}=1$); writing it in the way shown above, however, keeps the phase factor conjugate-symmetric even when the shifts are fractional (as they will be below), so the inverse DFT stays essentially real and free of artifacts. Notice that the formula above only lists two of the four cases; I think you can figure out what the other two cases should be.
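Here is a quick 1-D sanity check of the shift property we are using (a sketch, not part of the assignment, with hypothetical variable names): multiplying $X[k]$ by $e^{-j2\pi kd/N}$, with the upper half of the bins written as $k-N$, circularly shifts $x[n]$ by $d$ samples.
demo_x = np.arange(8.0)
N_demo, d_demo = len(demo_x), 3
k_demo = np.arange(N_demo)
k_signed = np.where(k_demo < N_demo/2, k_demo, k_demo - N_demo)   # k-N for the upper half of the bins
demo_X_shifted = np.fft.fft(demo_x) * np.exp(-2j*np.pi*k_signed*d_demo/N_demo)
print(np.allclose(np.real(np.fft.ifft(demo_X_shifted)), np.roll(demo_x, d_demo)))   # True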
importlib.reload(submitted)
help(submitted.downsample_and_shift_dft2)
Help on function downsample_and_shift_dft2 in module submitted:
downsample_and_shift_dft2(oversampled_dft, downsampling_factor, row_shift, col_shift)
Input:
oversampled_dft [M1,M2] - a 2d array containing the oversampled DFT of a grayscale image
downsampling_factor (scalar) - the factor by which the DFT image is oversampled
row_shift (scalar) - the number of rows that the image should be shifted
col_shift (scalar) - the number of columns that the image should be shifted
Output:
image [M1/downsampling_factor, M2/downsampling_factor] - the real part of the inverse DFT
of the valid frequency samples, shifted by the specified numbers of rows and columns.
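For reference, here is a rough sketch of one way such a function might be implemented (an illustration under the docstring's assumptions, not necessarily the intended solution; downsample_and_shift_dft2_sketch is a hypothetical name).
def downsample_and_shift_dft2_sketch(oversampled_dft, downsampling_factor, row_shift, col_shift):
    X = oversampled_dft[::downsampling_factor, ::downsampling_factor]   # keep only the valid bins
    N1, N2 = X.shape
    k1 = np.arange(N1)
    k1 = np.where(k1 < N1/2, k1, k1 - N1)          # signed row-frequency indices
    k2 = np.arange(N2)
    k2 = np.where(k2 < N2/2, k2, k2 - N2)          # signed column-frequency indices
    phase = np.exp(-2j*np.pi*(k1[:, None]*row_shift/N1 + k2[None, :]*col_shift/N2))
    return np.real(np.fft.ifft2(X * phase))        # real part of the shifted inverse DFT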
importlib.reload(submitted)
N1, N2 = mri_dft.shape
print('The original MRI_DFT shape is',N1,N2)
image = submitted.downsample_and_shift_dft2(mri_dft,2,N1/4,N2/4)
print('The downsampled image has shape', image.shape)
fig, ax = plt.subplots(figsize=(10,8))
ax.imshow(np.maximum(0,np.minimum(255,image)),cmap='gray')
The original MRI_DFT shape is 1114 962 The downsampled image has shape (557, 481)
<matplotlib.image.AxesImage at 0x7fa743735f10>
Filtering out noise is easier to do in the time domain if the noise is wideband (meaning that there is noise energy in a wide range of frequencies). Sometimes, though, the noise is confined to a narrow range of frequencies. For example, consider this image (this is the image "Clifton Beach 5, South Arm, Tasmania, Australia" by JJ Harrison, distributed on Wikimedia under the GNU Free Documentation License):
with h5py.File('data.hdf5','r') as f:
image = f['image'][:]
noisy_image = f['noisy_image'][:]
fig, ax = plt.subplots(1,2,figsize=(14,8))
ax[0].imshow(image)
ax[1].imshow(noisy_image)
<matplotlib.image.AxesImage at 0x7fa7437bfac0>
You can see that the noisy image has been corrupted with some type of random stripes. Let's see what the DFT looks like.
Normally, it might be hard to figure out where the noise is. Since we have the original image, though, we can calculate the signal-to-noise ratio in each FFT bin.
fig, axs = plt.subplots(4,1,figsize=(14,8))
image_dft = np.fft.fft2(image,axes=(0,1))
noisy_dft = np.fft.fft2(noisy_image, axes=(0,1))
noise = noisy_dft - image_dft
M,N,K = noisy_dft.shape
#axs[0].plot(np.abs(image_dft[:,0,1]/noise[:,0,1]))
axs[0].plot(20*np.log10(np.abs(image_dft[:,0,1]/noise[:,0,1])))
axs[0].plot(np.arange(M),np.zeros(M),'k--')
axs[0].set_title('SNR as a function of bin, Green Channel, across rows')
#axs[1].plot(np.abs(image_dft[0,:,1]/noise[0,:,1]))
axs[1].plot(20*np.log10(np.abs(image_dft[0,:,1]/noise[0,:,1])))
axs[1].plot(np.arange(N),np.zeros(N),'k--')
axs[1].set_title('SNR as a function of bin, Green Channel, across columns')
#axs[2].stem(np.abs(image_dft[:20,0,1]/noise[:20,0,1]))
axs[2].stem(20*np.log10(np.abs(image_dft[:20,0,1]/noise[:20,0,1])))
axs[2].set_title('SNR as a function of bin, Green Channel, across rows, zoomed in')
#axs[3].stem(np.abs(image_dft[0,:40,1]/noise[0,:40,1]))
axs[3].stem(20*np.log10(np.abs(image_dft[0,:40,1]/noise[0,:40,1])))
axs[3].set_title('SNR as a function of bin, Green Channel, across columns, zoomed in')
fig.tight_layout()
fig, axs = plt.subplots(figsize=(8,6))
print(noise.shape)
axs.imshow(np.abs(noise).astype('int'))
axs.set_xlabel('$k_2$')
axs.set_ylabel('$k_1$')
axs.set_title('Spatial Magnitude DFT of the Noise (noisy_image - image)')
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
(213, 320, 3)
Text(0.5, 1.0, 'Spatial Magnitude DFT of the Noise (noisy_image - image)')
It looks like the signal-to-noise ratio is lowest in the bands $16\le k_1< 19$, $N_1-19<k_1\le N_1-16$, $29\le k_2<32$, and $N_2-32<k_2\le N_2-29$.
We could get rid of this noise by using an ideal bandstop filter, as in MP4. Instead, this time, let's try to get rid of it using the DFT.
Let's try to get rid of the noise by just zeroing out those frequency bands. Implement the dft_filter function, with the following description:
$$X_{\mbox{corrected}}[k_1,k_2]=\begin{cases} 0 & \mbox{min}_1\le (k_1~\mbox{or}~N_1-k_1)<\mbox{max}_1\\ 0 & \mbox{min}_2\le (k_2~\mbox{or}~N_2-k_2)<\mbox{max}_2\\ X[k_1,k_2] & \mbox{otherwise} \end{cases}$$
where $\mbox{min}_1$, $\mbox{max}_1$, $\mbox{min}_2$, and $\mbox{max}_2$ are band edges.
This is the same as finding $Y[k]=H[k]X[k]$ where
$$H[k_1,k_2]=\begin{cases} 0 & \mbox{min}_1\le (k_1~\mbox{or}~N_1-k_1)<\mbox{max}_1\\ 0 & \mbox{min}_2\le (k_2~\mbox{or}~N_2-k_2)<\mbox{max}_2\\ 1 & \mbox{otherwise} \end{cases}$$
importlib.reload(submitted)
help(submitted.dft_filter)
Help on function dft_filter in module submitted:
dft_filter(noisy_image, min1, max1, min2, max2)
Input:
noisy_image [N1,N2] - an image with narrowband noises
min1, max1 (scalars) - zero out all rows of the DFT min1 <= k1 < max1, likewise for N1-k1
min2, max2 (scalars) - zero out all cols of the DFT min2 <= k2 < max2, likewise for N2-k2
Output:
cleaned_image [N1,N2] - image with the corrupted bands removed.
Be sure to take the real part of the inverse DFT, and then truncate
so that 0 <= cleaned_image[n1,n2,color] <= 1 for all n1,n2,color.
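As a rough illustration (not necessarily the intended solution), a mask-based version might look something like this; dft_filter_sketch is a hypothetical name, and it assumes the same bands are zeroed in all three color channels.
def dft_filter_sketch(noisy_image, min1, max1, min2, max2):
    N1, N2 = noisy_image.shape[0], noisy_image.shape[1]
    X = np.fft.fft2(noisy_image, axes=(0, 1))
    k1, k2 = np.arange(N1), np.arange(N2)
    bad_rows = ((k1 >= min1) & (k1 < max1)) | ((N1 - k1 >= min1) & (N1 - k1 < max1))
    bad_cols = ((k2 >= min2) & (k2 < max2)) | ((N2 - k2 >= min2) & (N2 - k2 < max2))
    X[bad_rows, :, :] = 0                          # zero the corrupted row bands
    X[:, bad_cols, :] = 0                          # zero the corrupted column bands
    return np.clip(np.real(np.fft.ifft2(X, axes=(0, 1))), 0, 1)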
importlib.reload(submitted)
cleaned_image = submitted.dft_filter(noisy_image,16,19,29,32)
fig, ax = plt.subplots(1,2,figsize=(14,8))
ax[0].imshow(image)
ax[1].imshow(cleaned_image)
<matplotlib.image.AxesImage at 0x7fa7482fe850>
As shown above, zeroing out the corrupted bands reduces the strong stripe effects on the right-hand side, but it seems to strengthen the ripple artifacts throughout the rest of the image.
Remember that, when we were using ideal filters, similar ripple artifacts were caused by truncating the impulse response using a rectangular window. The way we avoided ripple artifacts then was by using a Hamming window instead.
One important difference between a Hamming window and a rectangular window is that the Hamming window has a wider transition band. So let's introduce a transition band into our filter:
$$X_{\mbox{corrected}}[k_1,k_2]=\begin{cases} 0 & \mbox{min}_1\le (k_1~\mbox{or}~N_1-k_1)<\mbox{max}_1\\ 0 & \mbox{min}_2\le (k_2~\mbox{or}~N_2-k_2)<\mbox{max}_2\\ \frac{1}{2}X[k_1,k_2] & k_1\in\left\{\mbox{min}_1-1,\mbox{max}_1\right\}\\ \frac{1}{2}X[k_1,k_2] & k_2\in\left\{\mbox{min}_2-1,\mbox{max}_2\right\}\\ \frac{1}{2}X[k_1,k_2] & N_1-k_1\in\left\{\mbox{min}_1-1,\mbox{max}_1\right\}\\ \frac{1}{2}X[k_1,k_2] & N_2-k_2\in\left\{\mbox{min}_2-1,\mbox{max}_2\right\}\\ X[k_1,k_2] & \mbox{otherwise} \end{cases}$$
This is the same as finding $Y[k]=H[k]X[k]$ where
$$H[k_1,k_2]=\begin{cases} 0 & \mbox{min}_1\le (k_1~\mbox{or}~N_1-k_1)<\mbox{max}_1\\ 0 & \mbox{min}_2\le (k_2~\mbox{or}~N_2-k_2)<\mbox{max}_2\\ \frac{1}{2} & k_1\in\left\{\mbox{min}_1-1,\mbox{max}_1\right\}\\ \frac{1}{2} & k_2\in\left\{\mbox{min}_2-1,\mbox{max}_2\right\}\\ \frac{1}{2} & N_1-k_1\in\left\{\mbox{min}_1-1,\mbox{max}_1\right\}\\ \frac{1}{2} & N_2-k_2\in\left\{\mbox{min}_2-1,\mbox{max}_2\right\}\\ 1 & \mbox{otherwise} \end{cases}$$
importlib.reload(submitted)
help(submitted.transitioned_filter)
Help on function transitioned_filter in module submitted:
transitioned_filter(noisy_image, min1, max1, min2, max2)
Input:
noisy_image [N1,N2] - an image with narrowband noises
min1, max1 (scalars) - zero out all rows of the DFT min1 <= k1 < max1, likewise for N1-k1
min2, max2 (scalars) - zero out all cols of the DFT min2 <= k2 < max2, likewise for N2-k2
Output:
cleaned_image [N1,N2] - image with the corrupted bands removed.
Be sure to take the real part of the inverse DFT, and then truncate
so that 0 <= cleaned_image[n1,n2,color] <= 1 for all n1,n2,color.
Transition band:
the bands k1=min1-1, k1=max1, k2=min2-1, and k2=max2 should be set to half of their
original values, 0.5*X[k1,k2].
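For illustration only (a sketch with hypothetical names, assuming the same band conventions as above), the transitioned mask $H[k_1,k_2]$ could be built like this; multiplying it into the DFT of the noisy image as H[:, :, None] broadcasts it across the three color channels.
def transition_mask_sketch(N1, N2, min1, max1, min2, max2):
    H = np.ones((N1, N2))
    k1, k2 = np.arange(N1), np.arange(N2)
    edge_rows = np.isin(k1, [min1-1, max1]) | np.isin(N1 - k1, [min1-1, max1])
    edge_cols = np.isin(k2, [min2-1, max2]) | np.isin(N2 - k2, [min2-1, max2])
    H[edge_rows, :] = 0.5                          # transition bands
    H[:, edge_cols] = 0.5
    stop_rows = ((k1 >= min1) & (k1 < max1)) | ((N1 - k1 >= min1) & (N1 - k1 < max1))
    stop_cols = ((k2 >= min2) & (k2 < max2)) | ((N2 - k2 >= min2) & (N2 - k2 < max2))
    H[stop_rows, :] = 0                            # stopbands take priority over transition bands
    H[:, stop_cols] = 0
    return H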
importlib.reload(submitted)
transitioned_image = submitted.transitioned_filter(noisy_image,16,19,29,32)
fig, ax = plt.subplots(1,2,figsize=(14,10))
ax[0].imshow(cleaned_image)
ax[1].imshow(transitioned_image)
<matplotlib.image.AxesImage at 0x7fa7482f5760>
To be honest, it's a little hard to tell which cleaned-up image is better. Let's calculate their signal-to-noise ratios, in decibels.
error1 = cleaned_image - image
SNR1 = 20*np.log10(np.sum(np.square(image))/np.sum(np.square(error1)))
error2 = transitioned_image - image
SNR2 = 20*np.log10(np.sum(np.square(image))/np.sum(np.square(error2)))
print('w/o Transition band we get SNR=%.1f dB, w/Transition band, %.1f dB'%(SNR1,SNR2))
w/o Transition band we get SNR=42.5 dB, w/Transition band, 43.1 dB
It looks like the filter with the transition band has very slightly higher SNR.
Now let's try using overlap-add to filter a very long audio signal.
First, we need to zero-pad the input and the filter. Suppose you have an impulse response $h[n]$ of length $L$, and a signal $x[n]$ of length $M$. Then the function zero_pad should return $h[n]$ and $x[n]$, both zero-padded to $N=L+M-1$ samples.
importlib.reload(submitted)
help(submitted.zero_pad)
Help on function zero_pad in module submitted:
zero_pad(h, x)
(hp,xp) = zero_pad(h,x)
Input:
h [L] - a length-L impulse response array
x [M] - a length-M signal array
Return:
hp [N] - the same h, but zero-padded to a length of N=L+M-1
xp [N] - the same x, but zero-padded to a length of N=L+M-1
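A minimal sketch of what zero_pad needs to do (zero_pad_sketch is a hypothetical name, assuming 1-D arrays):
def zero_pad_sketch(h, x):
    N = len(h) + len(x) - 1
    hp = np.concatenate((h, np.zeros(N - len(h))))   # pad h with trailing zeros to length N
    xp = np.concatenate((x, np.zeros(N - len(x))))   # pad x with trailing zeros to length N
    return hp, xp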
Let's create a lowpass filter $h[n]$ with a cutoff of $0.075\pi$ radians/sample and, let's say, a length of 256 samples. For $x[n]$, let's just add two sine waves, one with a frequency of $0.05\pi$ radians/sample and one with a frequency of $0.1\pi$.
h = 0.075*np.sinc(0.075*(np.arange(256)-127.5)) * np.hamming(256)
x = np.sin(0.05*np.pi*np.arange(500))+np.sin(0.1*np.pi*np.arange(500))
hp, xp = submitted.zero_pad(h,x)
fig, ax = plt.subplots(2,2,figsize=(14,10))
ax[0,0].plot(h)
ax[0,1].plot(hp)
ax[1,0].plot(x)
ax[1,1].plot(xp)
[<matplotlib.lines.Line2D at 0x7fa74be33580>]
Now let's try multiplying their FFTs. The resulting $y[n]$ should still contain the sine wave at $0.05\pi$, but the sine wave at $0.1\pi$ should be mostly filtered out.
X = np.fft.fft(xp)
H = np.fft.fft(hp)
Y = X*H
y = np.real(np.fft.ifft(Y))
fig, ax = plt.subplots(1,2,figsize=(14,5))
ax[0].plot(y)
ax[0].set_title('Result of ifft(X[k]H[k])')
ax[1].plot(np.convolve(x,h))
ax[1].set_title('Result of x[n]*h[n]')
Text(0.5, 1.0, 'Result of x[n]*h[n]')
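As an optional sanity check (using the h, x, and y arrays defined in the cells above), the DFT-domain product should match linear convolution up to floating-point error, since we zero-padded both signals to $N=L+M-1$:
print(np.allclose(y, np.convolve(x, h)))   # expect True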
Let's download an audio file, add some noise to it, and then try to filter the worst of the noise out.
import urllib.request
example_url = "https://catalog.ldc.upenn.edu/desc/addenda/LDC93S1.wav"
webdata = urllib.request.urlopen(example_url).read()
f1 = open("webdata.wav", "wb")
f1.write(webdata)
f1.close()
Go ahead and listen to the file webdata.wav if you want to. Now you should go to a terminal and type
pip install soundfile
to install soundfile, then use it to read the audio data back in from the .wav file:
import soundfile as sf
speech_wave, speech_rate = sf.read("webdata.wav")
import IPython
IPython.display.Audio(data=speech_wave, rate=speech_rate)
Let's add noise, at an SNR of 0dB (noise is the same power as the speech):
import numpy as np
speech_power = np.average(np.square(speech_wave))
noisy_speech = speech_wave + np.sqrt(speech_power)*np.random.randn(len(speech_wave))
IPython.display.Audio(data=noisy_speech,rate=speech_rate)
Let's plot the SNR as a function of frequency, to see which frequencies we should keep.
import matplotlib.pyplot as plt
noise = noisy_speech - speech_wave
noise_dft = np.fft.fft(noise)
speech_dft = np.fft.fft(speech_wave)
SNR = 20*np.log10(np.abs(speech_dft)/np.abs(noise_dft))
frequency_axis = np.linspace(0,2*np.pi,len(speech_dft))
fig, ax = plt.subplots(1,2,figsize=(14,5))
ax[0].plot(frequency_axis, SNR)
ax[0].set_title('SNR vs. omega')
N = len(speech_dft)
ax[1].plot(frequency_axis[0:int(N/2)]/np.pi, SNR[0:int(N/2)])
ax[1].set_title('SNR vs. omega/pi')
Text(0.5, 1.0, 'SNR vs. omega/pi')
It looks like the SNR drops to about 0 dB somewhere near $0.6\pi$ radians/sample, so let's create an LPF with that cutoff frequency, and try filtering the speech using np.convolve. Since the speech waveform is quite long, that might take a long time, so we'll use time.time() to time the operations.
h = 0.6*np.sinc(0.6*(np.arange(256)-127.5)) * np.hamming(256)
import time
start_time = time.time()
y_using_convolution = np.convolve(noisy_speech,h)
end_time = time.time()
print('That took', end_time-start_time, 'seconds')
IPython.display.Audio(data=y_using_convolution,rate=speech_rate)
That took 0.0051119327545166016 seconds
Now let's try using overlap-add:
import importlib
importlib.reload(submitted)
help(submitted.overlap_add)
Help on function overlap_add in module submitted:
overlap_add(h, x, M)
y = overlap_add(h, x, M)
Input:
h [L] - a length-L impulse response array
x - a very long array containing the signal x
M (scalar) - the length of frames into which x should be chopped
Output:
y - the result of filtering x by h using overlap-add
First, zero-pad h to a length of N samples, where N=L+M-1.
Second, compute its DFT, H.
Third, chop x into frames of length M.
There should be NF of these; the last one might have fewer than M samples.
Fourth, prepare the output array, y, of length equal to NF*M + L - 1.
Fifth, for each frame of M samples in x:
- zero-pad to a length of N
- compute its DFT
- multiply its DFT by H
- inverse DFT
- add the inverse DFT to the correct place in the y array
Return y
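Here's a rough sketch of the algorithm described above (an illustration, not necessarily the intended solution; overlap_add_sketch is a hypothetical name):
def overlap_add_sketch(h, x, M):
    L = len(h)
    N = L + M - 1
    H = np.fft.fft(h, n=N)                         # zero-pad h to length N, then DFT
    NF = int(np.ceil(len(x) / M))                  # number of frames
    y = np.zeros(NF * M + L - 1)
    for f in range(NF):
        frame = x[f*M:(f+1)*M]                     # the last frame may be shorter than M
        yf = np.real(np.fft.ifft(np.fft.fft(frame, n=N) * H))
        y[f*M:f*M + N] += yf                       # overlap and add
    return y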
In order to make the FFT as efficient as possible, let's set M so that L+M-1 is a power of 2.
importlib.reload(submitted)
M = 1024 + 1 - len(h)
start_time = time.time()
y_overlap_add = submitted.overlap_add(h, noisy_speech, M)
end_time = time.time()
print('That took',end_time-start_time,'seconds')
IPython.display.Audio(data=y_overlap_add,rate=speech_rate)
That took 0.005012989044189453 seconds
If you have done this correctly, the two versions of y should be identical, except that y_overlap_add may be longer:
print('The average error is',np.average(np.abs(y_overlap_add[:len(y_using_convolution)]-y_using_convolution)))
The average error is 2.1766554318501152e-18