import os, h5py
import numpy as np
import matplotlib.figure
import matplotlib.pyplot as plt
%matplotlib inline
import importlib
import submitted

# Read every dataset used by this notebook while the file is open; the [:]
# slice pulls each one out of the HDF5 file before the handle is closed.
with h5py.File('data.hdf5','r') as f:
    print('data.hdf5 has the keys',f.keys())
    mri_dft, image, noisy_image = (
        f[name][:] for name in ('mri_dft', 'image', 'noisy_image')
    )

# Quick sanity check: report the shape and dtype of each array.
print('mri_dft is an array of shape', mri_dft.shape, 'and dtype', mri_dft.dtype)
print('image is an array of shape', image.shape, 'and dtype', image.dtype)
print('noisy_image is an array of shape', noisy_image.shape, 'and dtype', noisy_image.dtype)

data.hdf5 has the keys <KeysViewHDF5 ['image', 'mri_dft', 'noisy_image']>
mri_dft is an array of shape (1114, 962) and dtype complex128
image is an array of shape (213, 320, 3) and dtype float64
noisy_image is an array of shape (213, 320, 3) and dtype float64

# Invert the 2-D DFT to get the MRI back; the real part is floored at zero
# before being displayed in grayscale.
fig,ax = plt.subplots(figsize=(10,8))
mri_pixels = np.fft.ifft2(mri_dft).real
ax.imshow(np.maximum(0, mri_pixels), cmap='gray')

<matplotlib.image.AxesImage at 0x1230bd7b0>

# Stem plot of the DFT magnitude over the first 200 columns of row 0.
fig, ax = plt.subplots(figsize=(14,4))
first_row_magnitude = np.abs(mri_dft[0, :200])
ax.stem(first_row_magnitude)

<StemContainer object of 3 artists>

# Keep every downsampling_factor-th DFT sample along both axes, then invert
# and show the real part of the result.
downsampling_factor = 2
fig,ax = plt.subplots(figsize=(10,8))
decimated_dft = mri_dft[::downsampling_factor, ::downsampling_factor]
ax.imshow(np.fft.ifft2(decimated_dft).real, cmap='gray')

<matplotlib.image.AxesImage at 0x1230bec20>

# Reload so that edits made to submitted.py since the last import take effect,
# then print the docstring of the function implemented in this section.
importlib.reload(submitted)
help(submitted.downsample_and_shift_dft2)

Help on function downsample_and_shift_dft2 in module submitted:

downsample_and_shift_dft2(oversampled_dft, downsampling_factor, row_shift, col_shift)
    Input: 
      oversampled_dft [M1,M2] - a 2d array containing the oversampled DFT of a grayscale image
      downsampling_factor (scalar) - the factor by which the DFT image is oversampled
      row_shift (scalar)  - the number of rows that the image should be shifted
      col_shift (scalar) - the number of columns that the image should be shifted
    Output: 
      image [M1/downsampling_factor, M2/downsampling_factor] - the real part of the inverse DFT
      of the valid frequency samples, shifted by the specified numbers of rows and columns.

importlib.reload(submitted)
N1, N2 = mri_dft.shape
print('The original MRI_DFT shape is',N1,N2)
# Downsample by a factor of 2 and shift by a quarter of the original DFT size
# along each axis.
row_shift, col_shift = N1/4, N2/4
image = submitted.downsample_and_shift_dft2(mri_dft, 2, row_shift, col_shift)
print('The downsampled image has shape', image.shape)
fig, ax = plt.subplots(figsize=(10,8))
# Clamp pixel values to [0, 255] for display.
ax.imshow(np.clip(image, 0, 255), cmap='gray')

The original MRI_DFT shape is 1114 962
The downsampled image has shape (557, 481)

<matplotlib.image.AxesImage at 0x112516770>

# Re-read the colour image and its noisy version from disk (the name `image`
# was reassigned to the MRI result earlier in the notebook).
with h5py.File('data.hdf5','r') as f:
    image, noisy_image = (f[name][:] for name in ('image', 'noisy_image'))
# Left panel: clean image.  Right panel: noisy image.
fig, ax = plt.subplots(1, 2, figsize=(14,8))
ax[0].imshow(image)
ax[1].imshow(noisy_image)

<matplotlib.image.AxesImage at 0x1226bbf70>

fig, axs = plt.subplots(4,1,figsize=(14,8))
# 2-D DFT over the two spatial axes of each colour channel; the difference of
# the two DFTs isolates the noise in the frequency domain.
image_dft = np.fft.fft2(image, axes=(0,1))
noisy_dft = np.fft.fft2(noisy_image, axes=(0,1))
noise = noisy_dft - image_dft
M,N,K = noisy_dft.shape

# Magnitude of the noise in channel 1 (green) along the first column and the
# first row of the DFT.
green_down_rows = np.abs(noise[:,0,1])
green_across_cols = np.abs(noise[0,:,1])

# Full-length views, each with a dashed zero baseline for reference.
axs[0].plot(green_down_rows)
axs[0].plot(np.arange(M),np.zeros(M),'k--')
axs[0].set_title('Noise as a function of FFT bin, Green Channel, across rows')

axs[1].plot(green_across_cols)
axs[1].plot(np.arange(N),np.zeros(N),'k--')
axs[1].set_title('Noise as a function of FFT bin, Green Channel, across columns')

# Zoomed-in views of the lowest bins (first 20 rows, first 40 columns).
axs[2].stem(green_down_rows[:20])
axs[2].set_title('Noise as a function of FFT bin, Green Channel, across rows, zoomed in')

axs[3].stem(green_across_cols[:40])
axs[3].set_title('Noise as a function of FFT bin, Green Channel, across columns, zoomed in')
fig.tight_layout()

fig, axs = plt.subplots(figsize=(8,6))
print(noise.shape)
# Cast the magnitudes to integers so imshow interprets the three channels as
# integer RGB data (values outside 0..255 are clipped by imshow).
noise_magnitude = np.abs(noise).astype(int)
axs.imshow(noise_magnitude)
axs.set_xlabel('$k_2$')
axs.set_ylabel('$k_1$')
axs.set_title('Spatial Magnitude DFT of the Noise (noisy_image - image)')

Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).

(213, 320, 3)

Text(0.5, 1.0, 'Spatial Magnitude DFT of the Noise (noisy_image - image)')

# Reload so that edits made to submitted.py take effect, then print the
# docstring of the band-removal filter.
importlib.reload(submitted)
help(submitted.dft_filter)

Help on function dft_filter in module submitted:

dft_filter(noisy_image, min1, max1, min2, max2)
    Input: 
      noisy_image [N1,N2] - an image with narrowband noises
      min1, max1 (scalars) - zero out all rows of the DFT min1 <= k1 < max1, likewise  for N1-k1
      min2, max2 (scalars) - zero out all cols  of the DFT min2 <= k2 < max2, likewise for N2-k2
    Outut:
      cleaned_image [N1,N2] - image with the corrupted bands removed.
      Be sure to take the real part of the inverse DFT, and then truncate
      so that 0 <= cleaned_image[n1,n2,color] <= 1 for all n1,n2,color.

importlib.reload(submitted)
# (min, max) limits of the DFT rows and columns handed to the filter.
row_band, col_band = (16, 19), (29, 32)
cleaned_image = submitted.dft_filter(noisy_image, *row_band, *col_band)
# Left panel: original image.  Right panel: filtered result.
fig, ax = plt.subplots(1, 2, figsize=(14,8))
ax[0].imshow(image)
ax[1].imshow(cleaned_image)

<matplotlib.image.AxesImage at 0x12393a680>

# Reload so that edits made to submitted.py take effect, then print the
# docstring of the filter variant that adds a transition band.
importlib.reload(submitted)
help(submitted.transitioned_filter)

Help on function transitioned_filter in module submitted:

transitioned_filter(noisy_image, min1, max1, min2, max2)
    Input: 
      noisy_image [N1,N2] - an image with narrowband noises
      min1, max1 (scalars) - zero out all rows of the DFT min1 <= k1 < max1, likewise  for N1-k1
      min2, max2 (scalars) - zero out all cols  of the DFT min2 <= k2 < max2, likewise for N2-k2
    Outut:
      cleaned_image [N1,N2] - image with the corrupted bands removed.
      Be sure to take the real part of the inverse DFT, and then truncate
      so that 0 <= cleaned_image[n1,n2,color] <= 1 for all n1,n2,color.
    
    Transition band:
      the bands k1=min1-1, k1=max1, k2=min2-1, and k2=max2 should be set to half of their
      original values, 0.5*X[k1,k2].

importlib.reload(submitted)
# Same (min, max) row and column limits as used for dft_filter.
row_band, col_band = (16, 19), (29, 32)
transitioned_image = submitted.transitioned_filter(noisy_image, *row_band, *col_band)
# Left panel: hard-edged filter result.  Right panel: transition-band result.
fig, ax = plt.subplots(1, 2, figsize=(14,10))
ax[0].imshow(cleaned_image)
ax[1].imshow(transitioned_image)

<matplotlib.image.AxesImage at 0x123a12e00>

# Reload so that edits made to submitted.py take effect, then print the
# docstring of the zero-padding helper.
importlib.reload(submitted)
help(submitted.zero_pad)

Help on function zero_pad in module submitted:

zero_pad(h, x)
    (hp,xp) = zero_pad(h,x)
    Input:
      h [L] - a length-L impulse response array
      x [M] - a length-M signal array
    Return: 
      hp [N] - the same h, but zero-padded to a length of N=L+M-1
      xp [N] - the same x, but zero-padded to a length of N=L+M-1

# 256-tap sinc impulse response shaped by a Hamming window.
tap_offsets = np.arange(256)-127.5
h = 0.075*np.sinc(0.075*tap_offsets) * np.hamming(256)
# 500-sample test signal: the sum of two sinusoids.
sample_index = np.arange(500)
x = np.sin(0.05*np.pi*sample_index)+np.sin(0.1*np.pi*sample_index)
hp, xp = submitted.zero_pad(h,x)
# Top row: h and its padded version.  Bottom row: x and its padded version.
fig, ax = plt.subplots(2, 2, figsize=(14,10))
ax[0,0].plot(h)
ax[0,1].plot(hp)
ax[1,0].plot(x)
ax[1,1].plot(xp)

[<matplotlib.lines.Line2D at 0x1237f2f80>]

# Multiply the DFTs of the zero-padded sequences and invert the product.
X, H = np.fft.fft(xp), np.fft.fft(hp)
Y = X*H
y = np.fft.ifft(Y).real
fig, ax = plt.subplots(1, 2, figsize=(14,5))
# Left panel: frequency-domain result.
ax[0].plot(y)
ax[0].set_title('Result of ifft(X[k]H[k])')
# Right panel: direct time-domain convolution of the unpadded sequences.
direct_convolution = np.convolve(x,h)
ax[1].plot(direct_convolution)
ax[1].set_title('Result of x[n]*h[n]')

Text(0.5, 1.0, 'Result of x[n]*h[n]')

import urllib.request

# Download the example speech recording and save it next to the notebook.
example_url = "https://catalog.ldc.upenn.edu/desc/addenda/LDC93S1.wav"
# Context managers close the HTTP response and the output file even if the
# read or the write raises part-way through.
with urllib.request.urlopen(example_url) as response:
    webdata = response.read()
with open("webdata.wav", "wb") as f1:
    f1.write(webdata)

!pip install soundfile

Requirement already satisfied: soundfile in /Users/jhasegaw/anaconda3/lib/python3.10/site-packages (0.12.1)
Requirement already satisfied: cffi>=1.0 in /Users/jhasegaw/anaconda3/lib/python3.10/site-packages (from soundfile) (1.16.0)
Requirement already satisfied: pycparser in /Users/jhasegaw/anaconda3/lib/python3.10/site-packages (from cffi>=1.0->soundfile) (2.21)

import IPython
import soundfile as sf

# Read the samples and the sampling rate, then embed an audio player.
speech_wave, speech_rate = sf.read("webdata.wav")
IPython.display.Audio(data=speech_wave, rate=speech_rate)

import numpy as np

# Mean squared amplitude of the clean recording.
speech_power = np.mean(np.square(speech_wave))
# Add Gaussian noise scaled by sqrt(speech_power), i.e. noise whose expected
# power equals that of the speech.
noise_scale = np.sqrt(speech_power)
noisy_speech = speech_wave + noise_scale*np.random.randn(len(speech_wave))
IPython.display.Audio(data=noisy_speech, rate=speech_rate)

import matplotlib.pyplot as plt

N = len(noisy_speech)
noise = noisy_speech - speech_wave
noise_dft = np.fft.fft(noise)
speech_dft = np.fft.fft(speech_wave)
# Per-bin signal-to-noise ratio in decibels, from the ratio of DFT magnitudes.
SNR = 20*np.log10(np.abs(speech_dft)/np.abs(noise_dft))
# DFT bin k lies at k*speech_rate/N Hz, so the axis has to stop one bin short
# of speech_rate; including the endpoint would space the bins by
# speech_rate/(N-1) and mislabel every frequency slightly.
frequency_axis = np.linspace(0,speech_rate,N,endpoint=False)

# Only the first half of the bins (0 up to speech_rate/2) is plotted.
half = N//2
fig, ax = plt.subplots(3,1,figsize=(14,12))
# NOTE(review): the first two panels plot DFT magnitudes (np.abs), although
# their titles say "power".
ax[0].plot(frequency_axis[:half],np.abs(speech_dft[:half]))
ax[0].set_title('signal power')
ax[1].plot(frequency_axis[:half], np.abs(noise_dft[:half]))
ax[1].set_title('noise power')
ax[2].plot(frequency_axis[:half], SNR[:half])
ax[2].set_title('SNR in decibels')
ax[2].set_xlabel('Frequency (Hz)')
fig.tight_layout()

import time

# 2048-tap sinc impulse response shaped by a Hamming window.
h =0.4*np.sinc(0.4*(np.arange(2048)-1023.5)) * np.hamming(2048)
# perf_counter is a monotonic, high-resolution clock intended for timing short
# intervals; time.time() is a wall clock that can be too coarse (or jump)
# for a call that finishes in milliseconds.
start_time = time.perf_counter()
y_using_convolution = np.convolve(noisy_speech,h)
end_time = time.perf_counter()
print('That took', end_time-start_time, 'seconds')
IPython.display.Audio(data=y_using_convolution,rate=speech_rate)

That took 0.014723062515258789 seconds

# Reload so that edits made to submitted.py take effect, then print the
# docstring of the overlap-add implementation.
import importlib
importlib.reload(submitted)
help(submitted.overlap_add)

Help on function overlap_add in module submitted:

overlap_add(h, x, M)
    y = overlap_add(h, x, M)
    Input:
      h [L] - a length-L impulse response array
      x - a very long array containing the signal x
      M (scalar) - the length of frames into which x should be chopped
    Output:
      y - the result of filtering x by h using overlap-add
    
    First, zero-pad h to a length of N samples, where N=L+M-1.
    Second, compute its DFT, H.
    Third, chop x into frames of length M.  
      There should be NF of these; the last one might have fewer than M samples.
    Fourth, prepare the output array, y, of length equal to NF*M + L - 1.
    Fifth, for each frame of M samples in x:
     - zero-pad to a length of N
     - compute its DFT
     - multiply its DFT by H
     - inverse DFT
     - add the inverse DFT to the correct place in the y array
    Return y

importlib.reload(submitted)
# Frame length handed to overlap_add: one sample longer than the filter.
M = len(h)+1
# perf_counter is a monotonic, high-resolution clock intended for timing short
# intervals; time.time() can be too coarse for a call this fast.
start_time = time.perf_counter()
y_overlap_add = submitted.overlap_add(h, noisy_speech, M)
end_time = time.perf_counter()
print('That took',end_time-start_time,'seconds')
IPython.display.Audio(data=y_overlap_add,rate=speech_rate)

That took 0.005684852600097656 seconds

# Trim the overlap-add output to the length of the direct convolution, then
# report the mean absolute difference between the two results.
overlap_add_head = y_overlap_add[:len(y_using_convolution)]
print('The average error is', np.mean(np.abs(overlap_add_head - y_using_convolution)))

The average error is 2.679937256729359e-18

# Import the extra module, reload it so that edits to extra.py take effect,
# then print the docstring of the periodogram estimator.
import extra, importlib
importlib.reload(extra)
help(extra.bartlett_periodogram)

Help on function bartlett_periodogram in module extra:

bartlett_periodogram(x, K, L)
    Input: 
    x (real array) = signal
    K (int) = number of frames
    L (int) = length of each frame
    Output: 
    Xsq (real array) = average squared magnitude FFT

# Frame length L and number of frames K passed to the periodogram estimator.
L, K = 2048, 22
importlib.reload(extra)
Ssq = extra.bartlett_periodogram(speech_wave, K, L)
Vsq = extra.bartlett_periodogram(noise, K, L)
# One frequency per bin, from 0 up to (but not including) speech_rate.
frequency_axis = np.linspace(0, speech_rate, L, endpoint=False)

fig, ax = plt.subplots(2, 1, figsize=(14,8))
speech_axes, noise_axes = ax
speech_axes.plot(frequency_axis, Ssq)
speech_axes.set_title('Bartlett periodogram of the speech signal')
noise_axes.plot(frequency_axis, Vsq)
noise_axes.set_title('Bartlett periodogram of the noise signal')
noise_axes.set_xlabel('Frequency (Hz)')
fig.tight_layout()

# Reload so that edits made to extra.py take effect, then print the docstring
# of the Wiener filter routine.
importlib.reload(extra)
help(extra.wiener_filter)

Help on function wiener_filter in module extra:

wiener_filter(Ssq, Vsq)
    Input: 
    Ssq (real array, length L) = average squared magnitude FFT of the signal
    Vsq (real array, length L) = average squared magnitude FFT of the noise
    Output: 
    H (real array, length L) = frequency response of the Wiener filter
    h (real array, length L) = fftshifted impulse response of the Wiener filter

importlib.reload(extra)
# Frequency response H and impulse response h computed from the two
# periodograms.
H, h = extra.wiener_filter(Ssq, Vsq)

fig, ax = plt.subplots(2, 1, figsize=(14,8))
response_axes, impulse_axes = ax
# Top panel: frequency response against frequency in Hz.
response_axes.plot(frequency_axis, H)
response_axes.set_title('Wiener filter frequency response')
response_axes.set_xlabel('Frequency (Hz)')
# Bottom panel: impulse response against sample index.
impulse_axes.plot(h)
impulse_axes.set_title('Wiener filter impulse response')
impulse_axes.set_xlabel('Time (samples)')
fig.tight_layout()

importlib.reload(submitted)
# Frame length handed to overlap_add: one sample longer than the filter.
M = len(h)+1
# perf_counter is a monotonic, high-resolution clock intended for timing short
# intervals; time.time() can be too coarse for a call this fast.
start_time = time.perf_counter()
y_overlap_add = submitted.overlap_add(h, noisy_speech, M)
end_time = time.perf_counter()
print('That took',end_time-start_time,'seconds')
IPython.display.Audio(data=y_overlap_add,rate=speech_rate)

That took 0.006409883499145508 seconds

ECE 401 MP5: Discrete Fourier Transform¶

0. Data¶

1. MRI¶

2. Noisy Image¶

3. Transition Band¶

4. Overlap-Add¶

Extra Credit: Wiener Filter¶

Estimating $|S|^2$ and $|V|^2$ ¶

Computing $H$ and $h$ ¶

ECE 401 MP5: Discrete Fourier Transform¶

0. Data¶

1. MRI¶

2. Noisy Image¶

3. Transition Band¶

4. Overlap-Add¶

Extra Credit: Wiener Filter¶

Estimating $|S|^2$ and $|V|^2$ ¶

Computing $H$ and $h$ ¶

Estimating $|S|^2$ and $|V|^2$ ¶

Computing $H$ and $h$ ¶