The Fourier transform is one of the most important and widely used tools in theoretical physics, and it is also very useful in computational physics. In general, it allows us to break down functions (or signals) into their component frequencies for analysis, smoothing or filtering, and it also allows us to greatly increase the speed of certain calculations, e.g. solving the diffusion equation or the Schrödinger equation.
A periodic function $f(x)$ defined on a finite interval $0 \leq x \lt L$ can be written as a Fourier series (assuming it is bounded and has a finite number of extrema). If the function is even, i.e. symmetric about the midpoint, then we can use a cosine series:
$$f(x)=\sum_{k=0}^{\infty}\alpha _k \cos\left(\frac{2 \pi kx }{L}\right)$$where $\alpha_k$ are coefficients determined by the shape of the function. For an odd function, this can be written as a sine series:
$$f(x)=\sum_{k=1}^{\infty}\beta _k \sin\left(\frac{2 \pi kx }{L}\right)$$with the sum now starting from $k=1$. A general function can be written by combining the two forms:
$$f(x)=\sum_{k=0}^{\infty}\alpha _k \cos\left(\frac{2 \pi kx }{L}\right) + \sum_{k=1}^{\infty}\beta _k \sin\left(\frac{2 \pi kx }{L}\right)$$An alternative way to represent this general series is to make use of the identities $\cos\theta = \frac{1}{2}(e^{-i\theta}+e^{i\theta})$ and $\sin\theta = \frac{1}{2}i(e^{-i\theta}-e^{i\theta})$. Substituting these into the previous form gives:
$$f(x)=\frac{1}{2}\sum_{k=0}^{\infty}\alpha _k\left[\exp \left(-i\frac{2 \pi kx }{L}\right)+\exp \left(i\frac{2 \pi kx }{L}\right)\right] + \frac{1}{2}i\sum_{k=1}^{\infty}\beta _k\left[\exp \left(-i\frac{2 \pi kx }{L}\right)-\exp \left(i\frac{2 \pi kx }{L}\right)\right]$$which can be more straightforwardly written as:
$$f(x)=\sum_{k=-\infty}^{\infty}\gamma _k \exp \left(i\frac{2 \pi kx }{L}\right)$$where $$ \gamma _k= \begin{cases} \frac{1}{2}(\alpha_{-k}+i\beta_{-k}) & \text{if } k \lt 0\\ \alpha_0 & \text{if } k=0\\ \frac{1}{2}(\alpha_{k}-i\beta_{k}) & \text{if } k \gt 0 \end{cases} $$
If we can find the coefficients $\alpha_k$ for a given function $f(x)$ then we can represent it in a convenient way to implement in computational form. At first glance, this appears to be only useful for periodic functions, but it can be applied to any function if we are only interested in the interval from $0$ to $L$. Consider the following example:
from numpy import linspace
import matplotlib.pyplot as plt
limit=3
x = linspace(-limit,limit,100)
y = (x-3)*(x-2)*(x-1)*x*(x+1)*(x+2)*(x+3)
# 7th-order polynomial; note that the factored form is generally faster to evaluate than the expanded form:
#y_exp = x**7 - 14*x**5 + 49*x**3 - 36*x
fig, ax = plt.subplots(figsize=(12,8)) # use subplots so we can change the axis position with spines
ax.spines['bottom'].set_position('zero')
ax.plot(x,y,'b',zorder=1,linewidth=4)
ax.grid(True, which='both')
# # select the part of the data we are actually interested in
# xmin, xmax = 0, 2
# x_filt = x[(x >= xmin) & (x <= xmax)]
# y_filt = y[(x >= xmin) & (x <= xmax)]
# ax.axvspan(xmin, xmax, alpha=0.5, color='gray')
# ax.plot(x_filt,y_filt,'y--',linewidth=4)
# # now make this region periodic by plotting shifted copies of it
# images = 8
# for n in range(0,images,2):
#     ax.plot(x_filt + n - 4,y_filt,'r--',linewidth=4)
plt.show()
Now if we apply Fourier analysis to this, it will be valid from 0 to 2, but incorrect outside the limits where we defined the periodic function unit cell.
The coefficients $\gamma_k$ are in general complex and the standard way to calculate them is to evaluate the integral:
$$\int_{0}^{L}f(x)\exp \left(-i\frac{2 \pi kx }{L}\right)dx = \sum_{k^\prime=-\infty}^{\infty}\gamma_{k^\prime}\int_{0}^{L}\exp \left(i\frac{2 \pi (k^\prime-k)x }{L}\right)dx$$The integral on the right is straightforward for $k \neq k^\prime$: since $e^{i2\pi n} = 1$ for any integer $n$, we have:
$$ \begin{align} \int_{0}^{L}\exp \left(i\frac{2 \pi (k^\prime-k)x }{L}\right)dx &= \frac{L}{i2\pi(k^\prime-k)}\left[\exp\left(i\frac{2\pi(k^\prime-k)x}{L}\right)\right]^L_0 \\ &= \frac{L}{i2\pi(k^\prime-k)}[e^{i2\pi(k^\prime-k)}-1] \\ &= 0 \end{align} $$When $k = k^\prime$ then the integral becomes simply $\int_{0}^{L}1dx=L$ and we are left with only one nonzero term in the sum:
$$\int_{0}^{L}f(x)\exp \left(-i\frac{2 \pi kx }{L}\right)dx = L\gamma_k$$such that:
$$\gamma_k = \frac{1}{L}\int_{0}^{L}f(x)\exp \left(-i\frac{2 \pi kx }{L}\right)dx$$So from any periodic function (or any function that can be made so) we can find the Fourier coefficients and vice versa. Both are complete representations of the information contained in the function.
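Before moving to an analytic example, we can check this relation numerically. Below is a minimal sketch using a hypothetical test function $f(x)=x$ on $[0,1)$, whose exact coefficients are $\gamma_0=\frac{1}{2}$ and $\gamma_k=\frac{i}{2\pi k}$ otherwise; the integral is evaluated with the trapezoidal rule.

```python
import numpy as np

# Numerically evaluate gamma_k = (1/L) * integral_0^L f(x) exp(-i 2 pi k x / L) dx
# with the trapezoidal rule, for the test function f(x) = x on [0, 1),
# whose exact coefficients are gamma_0 = 1/2 and gamma_k = i/(2 pi k) otherwise.
def gamma(f, k, L, N=10000):
    x = np.linspace(0.0, L, N + 1)                  # grid including both endpoints
    g = f(x) * np.exp(-2j * np.pi * k * x / L)      # the integrand
    h = L / N
    return h * (g.sum() - 0.5 * (g[0] + g[-1])) / L # trapezoidal rule

for k in (0, 1, 2):
    exact = 0.5 if k == 0 else 1j / (2 * np.pi * k)
    print(k, gamma(lambda x: x, k, 1.0), exact)     # numerical vs exact
```

The numerical and exact values agree to many digits, which is a useful sanity check before relying on the formula for functions we cannot integrate by hand.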
As an example, let's consider the function $f(x)=e^x$ in the range $0 \lt x \lt 2\pi$, with $L=2\pi$:
$$f(x)=\sum_{k=-\infty}^{\infty}\gamma _k \exp \left(i\frac{2 \pi kx }{L}\right)$$where:
$$\gamma_k = \frac{1}{2\pi}\int_{0}^{2\pi}f(x)\exp \left(-ikx\right)dx$$$$= \frac{1}{2\pi}\int_{0}^{2\pi}\exp(x)\exp \left(-ikx\right)dx$$Skipping the derivation since we are physicists (Wolfram Alpha can do it for us), we get the Fourier coefficients as:
$$\gamma_k= -\frac{i\left(1-e^{2\pi(1-ik)}\right)}{2\pi(i+k)}$$with the complex Fourier series given by:
$$ f(x) = \sum_{k=-\infty}^{\infty} -\frac{i\left(1-e^{2\pi(1-ik)}\right)}{2\pi(i+k)}e^{ikx} $$We can then compare the two functions with a simple piece of Python code.
from numpy import linspace,exp,pi,real
import matplotlib.pyplot as plt
xlimit=2*pi # period of the function we are looking at
x = linspace(0,xlimit,100)
y = exp(x) # the original function
fig, ax = plt.subplots(figsize=(12,8)) # setup subplots so we can add a few things to the plot and move the axes
ax.spines['bottom'].set_position('zero')
ax.plot(x,y,'b',zorder=1,linewidth=4)
ax.grid(True, which='both')
# define the function that sums the Fourier series up to a given number of terms
def ft(x,klimit):
    gamma = 0.0
    for k in range(-klimit,klimit+1):
        gamma += -(1j*(1-exp(2*pi*(1-1j*k)))/(k+1j))*exp(1j*k*x)
    return gamma
# explore how the Fourier series depends on the number of terms
labels = ["exp(x)"] # we will have dynamically generated labels, so start the list here with the original function
for klimit in (1,5,10,50,100):
    y_ft = (1/(2*pi))*real(ft(x,klimit))
    labels.append(r'$klimit = %i$' % (klimit))
    ax.plot(x,y_ft,'--',zorder=1,linewidth=2)
plt.legend(labels, loc='upper left',
           columnspacing=1.0, labelspacing=0.0,
           handletextpad=1.0, handlelength=1.5,
           fancybox=True, shadow=True)
plt.show()
Repeat the Fourier analysis we just did for $f(x)=e^x$ for $f(x)=x^2$ and explore the behaviour with respect to the size of the series you use.
For many cases it is not possible to solve the Fourier integral analytically to give us an exact formula for the coefficients. Furthermore, when considering real data, we may not have an analytical form of $f(x)$ at all. In these cases we need to calculate the coefficients numerically, and here we can employ some of the integration techniques considered earlier in the course. In particular, for:
$$\gamma_k = \frac{1}{L}\int_{0}^{L}f(x)\exp \left(-i\frac{2 \pi kx }{L}\right)dx$$we can use the trapezoidal rule with $N$ slices of width $h=L/N$ each, giving:
$$\gamma_k = \frac{1}{L}\frac{L}{N}\left[ \frac{1}{2}f(0) + \frac{1}{2}f(L) + \sum_{n=1}^{N-1}f(x_n)\exp \left(-i\frac{2 \pi kx_n }{L}\right)\right]$$where the positions of the sample points for the integral are:
$$x_n=\frac{n}{N}L$$Since the function is by definition periodic, $f(0)=f(L)$ and this can be simplified to:
$$\gamma_k = \frac{1}{N}\left[\sum_{n=0}^{N-1}f(x_n)\exp \left(-i\frac{2 \pi kx_n }{L}\right)\right]$$This form is suited to finding the coefficients for a function that we know at only a set of regularly spaced points, a very common occurrence for physical problems. In fact, an even simpler form can be given if we define $y_n=f(x_n)$:
$$\gamma_k = \frac{1}{N}\left[\sum_{n=0}^{N-1}y_n \exp \left(-i\frac{2 \pi kn }{N}\right)\right]$$This is known as the discrete Fourier transform (DFT) of the $N$ samples $y_n$, commonly written as $c_k$ where $c_k=N\gamma_k$. While the integral approach we used in the derivation is approximate, it is relatively easy to show that the DFT is an exact result. Consider:
$$\sum_{k=0}^{N-1}c_k \exp \left(i\frac{2 \pi kn }{N}\right) = \sum_{k=0}^{N-1}\sum_{n^\prime =0}^{N-1}y_{n^\prime} \exp \left(-i\frac{2 \pi kn^\prime }{N}\right) \exp \left(i\frac{2 \pi kn }{N}\right)$$$$= \sum_{n^\prime =0}^{N-1}y_{n^\prime}\sum_{k=0}^{N-1}\exp \left(i\frac{2 \pi k(n-n^\prime) }{N}\right)$$In general, exponential sums of the form $\sum_{k=0}^{N-1}\exp \left(i\frac{2 \pi km }{N}\right)$ are equal to $N$ if $m$ is zero or a multiple of $N$, and zero otherwise. For $m=n-n^\prime$ in the above equation, both $n$ and $n^\prime$ are less than $N$, so there is no way for $m$ to be a nonzero multiple of $N$, leaving only $m=0$ when $n = n^\prime$. This leaves only a single term from the sum:
$$\sum_{k=0}^{N-1}c_k \exp \left(i\frac{2 \pi kn }{N}\right)=Ny_n$$equivalently written as:
$$y_n = \frac{1}{N}\sum_{k=0}^{N-1}c_k \exp \left(i\frac{2 \pi kn }{N}\right)$$known as the inverse discrete Fourier transform. It means we can extract the values of the samples $y_n$ from the coefficients $c_k$ exactly. Note that the DFT is powerful, but unlike the original Fourier series, it cannot tell us anything about the function between the sample points: the two functions below would have the same DFT if sampled at the points shown...
from numpy import linspace
import matplotlib.pyplot as plt
limit=3
x1 = linspace(-limit,limit,1000)
x2 = linspace(-limit,limit,8)
y1 = (x1-3)*(x1-2)*(x1-1)*x1*(x1+1)*(x1+2)*(x1+3)
y2 = (x2-3)*(x2-2)*(x2-1)*x2*(x2+1)*(x2+2)*(x2+3) # the same polynomial sampled coarsely; joined by straight lines it defines a different function with identical samples
fig, ax = plt.subplots(figsize=(12,8))
ax.spines['bottom'].set_position('zero')
ax.plot(x2, y2, 'o', color='black',
        markersize=15, linewidth=4,
        markerfacecolor='white',
        markeredgecolor='gray',
        markeredgewidth=2)
ax.plot(x1,y1,'b',zorder=1,linewidth=4)
ax.plot(x2,y2,'r',zorder=1,linewidth=4)
ax.grid(True, which='both')
plt.show()
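The same-samples ambiguity is known as aliasing, and we can demonstrate it directly with a minimal sketch (the frequencies here are hypothetical, chosen only for illustration): two sine waves whose frequencies differ by the number of samples $N$ produce exactly the same samples, and hence exactly the same DFT.

```python
import numpy as np

# Aliasing sketch (hypothetical frequencies): two sine waves whose frequencies
# differ by the number of samples N give identical samples, hence identical DFTs.
N = 8
n = np.arange(N)
y_slow = np.sin(2*np.pi*1*n/N)        # one cycle across the window
y_fast = np.sin(2*np.pi*(1 + N)*n/N)  # nine cycles, aliased onto one
assert np.allclose(y_slow, y_fast)                          # same samples
assert np.allclose(np.fft.fft(y_slow), np.fft.fft(y_fast))  # same DFT
print("two different waves, one DFT")
```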
If we have real data, as opposed to complex, which is generally the case, we only need to calculate the first $\frac{N}{2}+1$ coefficients of the DFT, as the rest are just their complex conjugates, and we can formulate a simple (and naive) Python function to find them:
from numpy import zeros,exp,pi
def dft(y):
    N = len(y)
    c = zeros(N//2+1,complex) # only sum over the first half of the series, assuming the data is real
    for k in range(N//2+1):
        for n in range(N):
            c[k] += y[n]*exp(-2j*pi*k*n/N)
    return c
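As a quick sanity check (a sketch using arbitrary random test data), this naive routine should agree with numpy's built-in real FFT, which computes the same coefficients far more efficiently, as we will see later:

```python
import numpy as np

# Sanity check of the naive DFT against numpy's built-in real FFT,
# which computes the same coefficients (arbitrary random test data).
def dft(y):
    N = len(y)
    c = np.zeros(N//2 + 1, complex)
    for k in range(N//2 + 1):
        for n in range(N):
            c[k] += y[n]*np.exp(-2j*np.pi*k*n/N)
    return c

y = np.random.default_rng(0).normal(size=64)
assert np.allclose(dft(y), np.fft.rfft(y))   # both give the same c_k
print("naive DFT matches numpy.fft.rfft")
```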
Let's apply this function to some wave data we have handy:
from numpy import loadtxt,size
import matplotlib.pyplot as plt
x = loadtxt("pitch.txt",float) # load the waveform we are looking at
c = dft(x)
plt.figure(figsize=(16,8)) # set the figsize
plt.subplot(1,2,1)
plt.xlabel("$t$")
plt.ylabel("$f(t)$")
plt.plot(x)
plt.subplot(1,2,2)
plt.xlim(0,500)
plt.xlabel("$k$")
plt.ylabel("$c_k$")
plt.plot(abs(c),'r') # plot the absolute values, since the coefficients are generally complex
plt.show()
We have now explored the Fourier transform mathematically and computationally, but at this point it is important to think about what it actually means physically. The Fourier transform converts the function into a series of real or complex sinusoidal waves, with each term in the series representing one wave with a well-defined frequency. For $f(x)$ these are spatial frequencies and for $f(t)$ temporal frequencies, so the transform tells us which frequencies, with which weights, combine to represent the original function. This is effectively what signal analyzers do; for example, the graphical visualizers in many music systems are basically just Fourier transforming the music signal and outputting the result.
Consider the data that we just plotted. The original waveform has a clearly periodic set of main peaks, but there is also some noise - as sound this would translate into a tone at a constant frequency with a background hiss due to the noise. This can be seen clearly in the DFT, where the $c_k$ are dominated by one peak at low frequency, but we also see other peaks rising above the background noise. These are harmonics of the main peak at multiples of its frequency, telling us that the original function was not a pure sine wave, which could be represented by a single peak.
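We can mimic this structure with synthetic data (a sketch; the fundamental frequency, harmonic amplitudes and noise level are arbitrary choices, not taken from pitch.txt). The three largest coefficients land exactly at the fundamental and its harmonics, while the noise only raises the background:

```python
import numpy as np

# Synthesize a periodic but non-sinusoidal signal plus noise (a sketch;
# the fundamental f0, harmonic amplitudes and noise level are arbitrary).
rng = np.random.default_rng(1)
N = 1024
n = np.arange(N)
f0 = 16  # fundamental: 16 cycles across the sampling window
y = (np.sin(2*np.pi*f0*n/N)
     + 0.5*np.sin(2*np.pi*2*f0*n/N)    # second harmonic
     + 0.25*np.sin(2*np.pi*3*f0*n/N)   # third harmonic
     + 0.05*rng.normal(size=N))        # background "hiss"
c = np.fft.rfft(y)
peaks = np.sort(np.argsort(abs(c))[-3:])   # indices of the three largest |c_k|
print(peaks)                               # the fundamental and its harmonics
```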
Take the coefficients from the example we just looked at and use the inverse DFT to reconstruct the original function.
For DFTs, if we shift our sample points such that:
$$x_n^\prime=x_n + \Delta=\frac{n}{N}L+\Delta$$we find that the equivalent Fourier transform for this set of samples is:
$$c_k = \sum_{n=0}^{N-1}f(x_n+\Delta) \exp \left(-i\frac{2 \pi k(x_n+\Delta) }{L}\right)$$$$= \exp \left(-i\frac{2 \pi k\Delta }{L}\right) \sum_{n=0}^{N-1}f(x_n^\prime) \exp \left(-i\frac{2 \pi kx_n }{L}\right)$$$$= \exp \left(-i\frac{2 \pi k\Delta }{L}\right) \sum_{n=0}^{N-1}y_n^\prime \exp \left(-i\frac{2 \pi kn }{N}\right)$$where $y_n^\prime = f(x_n^\prime)$. But this is just our original formulation of the DFT with an additional phase factor - the DFT is essentially independent of where we place the samples. Usually the phase is absorbed into the definition of $c_k$, such that $c_k^\prime=\exp(i2\pi k\Delta/L)c_k$.
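A closely related case is easy to check numerically (a sketch with an arbitrary $L$-periodic test function): if we pick $\Delta$ to be a whole number $j$ of sample spacings, $\Delta = jL/N$, the shifted samples are just a circular shift of the originals, and the DFT picks up exactly the phase factor $\exp(i2\pi k\Delta/L)=\exp(i2\pi kj/N)$.

```python
import numpy as np

# Check the shift property numerically (a sketch): moving every sample point
# by a whole number j of sample spacings, Delta = j*L/N, changes the DFT only
# by the phase factor exp(i 2 pi k Delta / L) = exp(i 2 pi k j / N).
N, L, j = 64, 2*np.pi, 5
x = np.arange(N)*L/N
f = lambda x: np.cos(x) + 0.3*np.sin(3*x)   # an arbitrary L-periodic test function
c  = np.fft.fft(f(x))                       # DFT of the original samples
cs = np.fft.fft(f(x + j*L/N))               # DFT of the shifted samples
k = np.arange(N)
assert np.allclose(cs, np.exp(2j*np.pi*k*j/N)*c)
print("shifted samples give the same DFT up to a phase factor")
```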
For generality we introduced the complex form of the Fourier transform, but there are many practical cases where it makes more sense to use the cosine transform (the sine form is much more rarely used since it requires the function to be zero at $x=0$ and $x=L$). If we return to the cosine series:
$$f(x)=\sum_{k=0}^{\infty}\alpha _k \cos\left(\frac{2 \pi kx }{L}\right)$$we already noted that this is only valid for even functions, i.e. those that are symmetric about the midpoint. This might initially seem a major flaw, but any function can be made even by appending a mirror image of itself and then repeating the result. This construction also means that the number of samples, $N$, is always even.
from numpy import linspace
import matplotlib.pyplot as plt
limit=3
x = linspace(-limit,limit,1000)
y = (x-3)*(x-2)*(x-1)*x*(x+1)*(x+2)*(x+3)
fig, ax = plt.subplots(figsize=(12,8))
ax.spines['bottom'].set_position('zero')
plt.xlim(-limit,7*limit)
plt.ylim(-100,100)
ax.plot(x,y,'b',zorder=1,linewidth=4)
ax.plot(x[::45], y[::45], 'o', color='black',
markersize=15, linewidth=4,
markerfacecolor='white',
markeredgecolor='gray',
markeredgewidth=2)
ax.axvspan(-limit, limit, alpha=0.5, color='gray')
ax.grid(True, which='both')
# this can be done much more easily in Pythonic form with array manipulations, see the DCT function later, but simplicity first.
for n in range(1,limit+1):
    ax.plot(((-1)**n)*x+2*n*limit,y,'r--',zorder=1,linewidth=4)
plt.show()
Once we have a symmetric function, the DCT is simply the special case of $c_k$ in which $y_n$ is symmetric about $x=\frac{1}{2}L$, with $y_n=y_{N-n}$ for all $n$. Given that $N$ is even, we can split the sum and rewrite the equation for the coefficients as follows (noting that $e^{i2\pi k}=1$ for all integer $k$):
$$c_k = \sum_{n=0}^{\frac{1}{2}N}y_n \exp \left(-i\frac{2 \pi kn }{N}\right) + \sum_{n=\frac{1}{2}N+1}^{N-1}y_{N-n} \exp \left(-i\frac{2 \pi kn }{N}\right)$$
Making a change of variables such that $N-n \rightarrow n$, and using the identity $\cos\theta = \frac{1}{2}(e^{-i\theta}+e^{i\theta})$, we get the discrete cosine transform (DCT):
$$c_k = \sum_{n=0}^{\frac{1}{2}N}y_n \exp \left(-i\frac{2 \pi kn }{N}\right) + \sum_{n=1}^{\frac{1}{2}N-1}y_n \exp \left(i\frac{2 \pi kn }{N}\right)$$$$= y_0 + y_{\frac{N}{2}}\cos\left(\pi k\right) + 2\sum_{n=1}^{\frac{1}{2}N-1}y_n \cos \left(\frac{2 \pi kn }{N}\right) $$The inverse of this is very similar, differing only by the leading $\frac{1}{N}$ factor:
$$y_n = \frac{1}{N}\left[ c_0 + c_{\frac{N}{2}}\cos\left(\pi n\right) + 2\sum_{k=1}^{\frac{1}{2}N-1}c_k \cos \left(\frac{2 \pi kn }{N}\right)\right] $$Note that it is common to see DCT formulations where the samples are taken at the midpoints of the sample intervals, known as a "Type-II" DCT, which is effectively the same but implies that $y_n = y_{N-1-n}$, and for an even $N$:
$$c_k= \sum_{n=0}^{\frac{1}{2}N-1}y_n \exp \left(-i\frac{2\pi kn}{N}\right) + \sum_{n=\frac{1}{2}N}^{N-1}y_n \exp \left(-i\frac{2\pi kn}{N}\right)$$$$= \exp \left(i\frac{\pi k}{N}\right) \left[ \sum_{n=0}^{\frac{1}{2}N-1}y_n \exp \left(-i\frac{2\pi k(n+\frac{1}{2})}{N}\right) + \sum_{n=\frac{1}{2}N}^{N-1}y_{N-1-n} \exp \left(i\frac{2\pi k(N-\frac{1}{2}-n)}{N}\right) \right]$$$$= \exp \left(i\frac{\pi k}{N}\right) \left[ \sum_{n=0}^{\frac{1}{2}N-1}y_n \exp \left(-i\frac{2\pi k(n+\frac{1}{2})}{N}\right) + \sum_{n=0}^{\frac{1}{2}N-1}y_{n} \exp \left(i\frac{2\pi k(n+\frac{1}{2})}{N}\right) \right]$$$$= 2\exp \left(i\frac{\pi k}{N}\right) \sum_{n=0}^{\frac{1}{2}N-1}y_n \cos \left(\frac{2\pi k(n+\frac{1}{2})}{N}\right) $$Conventionally the leading phase factor is included in the Fourier coefficients such that:
$$a_k = 2 \sum_{n=0}^{\frac{1}{2}N-1}y_n \cos \left(\frac{2\pi k(n+\frac{1}{2})}{N}\right) $$and the inverse is:
$$y_n= \frac{1}{N}\left[ a_0 + 2\sum_{k=1}^{\frac{1}{2}N-1}a_k \cos \left(\frac{2\pi k(n+\frac{1}{2})}{N}\right)\right]$$Redefining $\frac{1}{2}N \rightarrow N$ and $a_k \rightarrow 2a_k$, this is often written as follows:
$$a_k= \sum_{n=0}^{N-1}y_n \cos \left(\frac{\pi k(n+\frac{1}{2})}{N}\right), \qquad y_n= \frac{1}{N}\left[ a_0 + 2\sum_{k=1}^{N-1}a_k \cos \left(\frac{\pi k(n+\frac{1}{2})}{N}\right)\right]$$DCTs are behind a lot of the original compression algorithms used in music, image and video files. In particular, JPEGs are constructed by dividing an image into blocks, performing DCTs on these blocks and then filtering the resultant coefficients to remove small contributions to the signal. When you open a JPEG file, a version of an inverse DCT reconstructs the original image from the stored coefficients, including compression artifacts if important coefficients have been discarded. MP3s take the filtering a stage further by keeping only the coefficients that make sense from the perspective of what the human ear can hear.
The DCT transforms an 8×8 block of input values to a linear combination of these 64 patterns. The patterns are referred to as the two-dimensional DCT basis functions, and the output values are referred to as transform coefficients.
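The final forward/inverse pair above can be checked numerically with a short sketch (arbitrary random data; note that scipy's unnormalised Type-II DCT carries an extra overall factor of 2 relative to $a_k$ as written here):

```python
import numpy as np
from scipy.fftpack import dct

# Check the final forward/inverse DCT-II pair numerically (arbitrary random
# data; scipy's unnormalised Type-II DCT equals 2*a_k in this convention).
rng = np.random.default_rng(2)
N = 16
y = rng.normal(size=N)
C = np.cos(np.pi*np.outer(np.arange(N), np.arange(N) + 0.5)/N)  # C[k,n] = cos(pi k (n+1/2)/N)
a = C @ y                                  # forward: a_k = sum_n y_n cos(...)
assert np.allclose(2*a, dct(y, type=2))    # agrees with scipy up to the factor of 2
y_back = (a[0] + 2*(C[1:].T @ a[1:]))/N    # inverse formula from above
assert np.allclose(y_back, y)              # recovers the samples exactly
print("forward and inverse DCT-II sums check out")
```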
Before we explore the potential of Fourier transforms for 2D data, it is worth looking a little at the basic equations behind it. For a 2D function $f(x,y)$, we need to transform first with respect to $x$ and then with respect to $y$. If we have an $M \times N$ grid of data, we first perform an ordinary Fourier transform on each of the $M$ rows:
$$c^\prime_{ml} = \sum_{n=0}^{N-1}y_{mn} \exp \left(-i\frac{2 \pi ln }{N}\right)$$For each row $m$ we now have $N$ coefficients, one for each value of $l$. Next we take the $l$th coefficient in each of the $M$ rows and Fourier transform these $M$ values again to get:
$$c_{kl} = \sum_{m=0}^{M-1}c^\prime_{ml} \exp \left(-i\frac{2 \pi km }{M}\right)$$If we now combine these, we can formulate a complete expression for the Fourier transform in 2D:
$$c_{kl} = \sum_{m=0}^{M-1}\sum_{n=0}^{N-1}y_{mn} \exp \left[-i2\pi \left(\frac{km}{M}+\frac{ln}{N}\right)\right]$$with the corresponding inverse transform as follows:
$$y_{mn} = \frac{1}{MN}\sum_{k=0}^{M-1}\sum_{l=0}^{N-1}c_{kl} \exp \left[i2\pi \left(\frac{km}{M}+\frac{ln}{N}\right)\right]$$We can see this in action by coding (a very basic) compression algorithm for an image.
from numpy import empty,arange,exp,real,pi,place,argwhere,size
from numpy.fft import rfft,irfft
import matplotlib.pyplot as plt
from scipy.sparse import coo_matrix
# Numpy does not have a DCT directly, so we have to build one manually - note that scipy does have one, but this is a useful teaching example
######################################################################
# 1D DCT Type-II function
def dct(y):
    N = len(y)
    y2 = empty(2*N,float) # create an empty array for the mirrored function
    y2[:N] = y[:] # the first N elements of y2 are taken from y
    y2[N:] = y[::-1] # the elements after N are reversed, giving us a symmetric, even function
    c = rfft(y2) # perform the Fourier transform. This uses a numpy function (Real Fast Fourier Transform), otherwise everything takes too long - we will discuss it later.
    phi = exp(-1j*pi*arange(N)/(2*N)) # create an array with terms 0 to N-1 and use it to define the leading phase factor
    return real(phi*c[:N]) # return the real part of the transform
######################################################################
# 2D DCT function
def dct2(y):
    M = y.shape[0] # first dimension of input function, used to define limits
    N = y.shape[1] # second dimension of input function, used to define limits
    a = empty([M,N],float) # create arrays to store our result - a for the first transform and b for the second
    b = empty([M,N],float)
    # run the 1D transforms along the rows, then the columns
    for i in range(M):
        a[i,:] = dct(y[i,:])
    for j in range(N):
        b[:,j] = dct(a[:,j])
    return b
######################################################################
# 1D inverse DCT Type-II function
def idct(a):
    N = len(a)
    c = empty(N+1,complex)
    phi = exp(1j*pi*arange(N)/(2*N))
    c[:N] = phi*a
    c[N] = 0.0
    return irfft(c)[:N] # (Inverse Real Fast Fourier Transform)
######################################################################
# 2D inverse DCT function
def idct2(b):
    M = b.shape[0]
    N = b.shape[1]
    a = empty([M,N],float)
    y = empty([M,N],float)
    for i in range(M):
        a[i,:] = idct(b[i,:])
    for j in range(N):
        y[:,j] = idct(a[:,j])
    return y
adam = plt.imread('images/photo.tiff') # Read in TIFF picture file. TIFF is lossless, so generally very large compared to compressed formats.
singch_adam = adam[:, :, 0] # slice image into a single channel so the transform can handle it.
plt.figure(figsize=(12,6)) # set the figsize
# plot the original image
plt.subplot(1,2,1)
plt.imshow(singch_adam, cmap="plasma") # a default colourmap is applied, there are no colour channels in the data anymore
plt.colorbar()
adam_dct = dct2(singch_adam) # apply the 2D DCT to the single channel image
# plot the DCT of the image, limiting the scale so we can actually see something
plt.subplot(1,2,2)
plt.imshow(adam_dct, cmap="plasma",clim=(0, 1e4))
plt.colorbar()
plt.show()
# define a threshold for cutting the coefficients
cutoff_amplitude = 1e6
place(adam_dct, abs(adam_dct) < cutoff_amplitude, [0]) # put zeroes into the array wherever a coefficient is below the cutoff
original_size = adam_dct.shape[0]*adam_dct.shape[1]
components_removed = argwhere(abs(adam_dct) < cutoff_amplitude).shape[0] # count how many components were removed
# give some nice output on how much we have cut from the DCT
percent_remaining = (1-components_removed/original_size)*100
print("Removed {} out of {} components. Image contains {:.2f}% of the original components.".format(components_removed, original_size, percent_remaining))
plt.figure(figsize=(12,6)) # set the figsize
plt.subplot(1,2,1)
plt.imshow(adam_dct, cmap="plasma",clim=(0, 1e4))
plt.colorbar()
adam_idct = idct2(adam_dct) # run the inverse DCT on the coefficients to generate the "compressed" image
plt.subplot(1,2,2)
plt.imshow(adam_idct, cmap="plasma")
plt.colorbar()
plt.show()
# now actually remove all the zeroes so that we are really handling a smaller array
adam_compressed = coo_matrix(adam_dct)
print("Now we have really reduced the array to {:.2f}% of its original size.".format(100*size(adam_compressed)/size(adam_dct)))
# but to actually do anything with it, we need to decompress it and see whether we lost any data.
adam_decomp = adam_compressed.toarray()
plt.figure(figsize=(12,6)) # set the figsize
plt.subplot(1,2,1)
plt.imshow(adam_decomp, cmap="plasma",clim=(0, 1e4))
plt.colorbar()
adam_idct_decomp = idct2(adam_decomp)
plt.subplot(1,2,2)
plt.imshow(adam_idct_decomp, cmap="plasma")
plt.colorbar()
plt.show()
plt.imsave('images/photo_compressed',adam_idct_decomp, format='tiff') # but this is still the same size, as we had to decompress it.
Removed 2880806 out of 2882544 components. Image contains 0.06% of the original components.
Now we have really reduced the array to 0.06% of its original size.
We introduced the DFT in the following form:
$$c_k = \sum_{n=0}^{N-1}y_n \exp \left(-i\frac{2 \pi kn }{N}\right)$$In the simple approach we discussed for solving this, we must sum over $N$ terms and repeat this $\frac{1}{2}N+1$ times, so it scales as $N^2$ and becomes prohibitively expensive for large datasets (just try it). The numpy routines introduced in the image compression example hint that this is not the most efficient way of solving the problem. A cleverer approach was introduced by Gauss (in 1805), and it is simplest to understand if we assume the number of samples is a power of two, such that $N=2^m$ where $m$ is an integer. If we split our sum into two equally sized samples, of odd and even $n$, then the sum of the even terms can be written as:
$$E_k = \sum_{r=0}^{\frac{1}{2}N-1}y_{2r} \exp \left(-i\frac{2 \pi k(2r) }{N}\right) = \sum_{r=0}^{\frac{1}{2}N-1}y_{2r} \exp \left(-i\frac{2 \pi kr }{\frac{1}{2}N}\right)$$But this is just another Fourier transform with $\frac{1}{2}N$ samples instead of $N$. Similarly, for the odd terms we get:
$$\sum_{r=0}^{\frac{1}{2}N-1}y_{2r+1} \exp \left(-i\frac{2 \pi k(2r+1) }{N}\right) = \exp\left(-i\frac{2 \pi k}{N}\right)\sum_{r=0}^{\frac{1}{2}N-1}y_{2r+1} \exp \left(-i\frac{2 \pi kr }{\frac{1}{2}N}\right)$$$$= \exp\left(-i\frac{2 \pi k}{N}\right)O_k$$where $O_k$ is another Fourier transform with $\frac{1}{2}N$ samples. Then the complete Fourier coefficient is the sum of the odd and even terms:
$$c_k = E_k + \exp\left(-i\frac{2 \pi k}{N}\right)O_k$$So we can get the Fourier transform of any function $f(x)$ by finding two Fourier transforms of that function with half as many points spaced twice as far apart (with an extra factor, $\exp\left(-i\frac{2 \pi k}{N}\right)$, called the twiddle factor). But we can apply the same split again to the two new transforms, and keep repeating the process until each transform is just that of a single sample, for which $k=0$, $N=1$ and the single coefficient is:
$$c_0 = \sum_{n=0}^{0}y_ne^0=y_0$$So the transform of a single sample is just the sample itself. The actual calculation therefore starts with the individual samples (which are their own transforms) and then combines them in pairs, then pairs into fours, and so on until the complete transform is assembled. Each level requires of order $N$ operations: first $N$ single-sample transforms, then $\frac{1}{2} N$ transforms of two coefficients, then $\frac{1}{4} N$ transforms of four coefficients, and so on. After $m$ levels we have combined $2^m$ samples, so the total number of levels is given by $2^m=N$, or $m=\log_2 N$. Compared to scaling with $N^2$ we now have $\log_2 N$ levels times $N$ coefficients, scaling as $N\log_2 N$ - for a million samples this is a difference of $\frac{1}{2}N^2=5\times 10^{11}$ operations compared to $N\log_2 N=2\times 10^{7}$, more than four orders of magnitude faster. This is why it is known as the Fast Fourier Transform (FFT) and is the form generally used. An equally fast form can be derived for the inverse, giving us the Inverse Fast Fourier Transform (inverse FFT). Note that the formulation also works when the number of samples is not a power of two, but the derivation is considerably more complex.
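The recursion described above can be written down almost directly. Below is a minimal sketch (assuming $N$ is a power of two; library FFTs are iterative, in-place and far more optimised) checked against numpy:

```python
import numpy as np

# A minimal recursive radix-2 FFT following the even/odd split above
# (a sketch for N a power of two; library FFTs are iterative and far faster).
def fft_rec(y):
    y = np.asarray(y, complex)
    N = len(y)
    if N == 1:
        return y                        # a single sample is its own transform
    E = fft_rec(y[0::2])                # transform of the even-indexed samples
    O = fft_rec(y[1::2])                # transform of the odd-indexed samples
    w = np.exp(-2j*np.pi*np.arange(N//2)/N)   # twiddle factors
    # c_k = E_k + w^k O_k; the upper half follows from the N/2-periodicity of E and O
    return np.concatenate([E + w*O, E - w*O])

y = np.random.default_rng(3).normal(size=256)
assert np.allclose(fft_rec(y), np.fft.fft(y))
print("recursive FFT matches numpy.fft.fft")
```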
Here is an example using `fft`. The only required argument for `fft` and `ifft` is an $N$-element array of floating-point or complex numbers; the sampling time $\tau$ does not appear in the formulas above, but it is needed to figure out the frequencies represented by the points in the transformed array.
import matplotlib.pyplot as plt
from numpy import pi,cos,exp,real,imag,linspace
from numpy.fft import fft
def ffunc(t):
    """Function defines data to be transformed,
    in this case a cosine oscillation in time and
    exponential decay."""
    return cos(2*pi*freq*t)*exp(-t/tdecay)
freq = 200e3 # oscillation frequency (Hz), here 200 kHz
tdecay = 100e-6 # decay time (s), here 100 microseconds
# Get data to be transformed by sampling function above, and plot
nn = 200 # number of points
tau = 1e-6 # sampling time (s), here 1 microsec
t = linspace(0,(nn-1)*tau,nn) # array of sample times (s)
f = ffunc(t) # array of sampled function points
plt.figure()
plt.plot(t/1e-6,f,label='f(t)')
plt.legend()
plt.xlabel(r'$t$ ($\mu$s)')
plt.show()
# Compute the discrete FT of the data, and plot:
ftwid = fft(f) # do the discrete FT
nun = 1/(2*tau) # Nyquist frequency (Hz), value is one-half of the sampling rate
numax = 2*((nn-1)/nn)* nun # max frequency in the DFT (Hz)
nu = linspace(0,numax,nn) # array of frequencies (Hz)
plt.figure()
plt.rc('font',size=12)
plt.plot(nu/1e3,real(ftwid),label=r'Re[$\tilde{f}(\nu)$]')
plt.plot(nu/1e3,imag(ftwid),label=r'Im[$\tilde{f}(\nu)$]')
plt.legend()
plt.xlabel(r'$\nu$ (kHz)')
plt.show()
In the example the original data $f_n$ are real, consisting of a cosine oscillating at 200 kHz multiplied by a decaying exponential. Nevertheless, the DFT of these data, $\tilde{f}_k$, is complex.
The second half of the plot above, labeled from 500 kHz to 1000 kHz, really holds negative frequencies from −500 kHz to zero. Thus the DFT of this input data actually has peaks at +200 kHz and −200 kHz. If we wish to display the frequency axis correctly, we can use the numpy function `roll` to shift the DFT so that zero frequency is in the middle (note that the DCT always gives real results and positive frequencies):
from numpy import roll
# "Roll" the data to the right so zero freq will be in the middle
shift = nn//2 # points to shift the DFT data, must be int
ftwid2 = roll(ftwid,shift)
# Compute a shifted set of frequency values:
nushift = shift/(nn*tau) # using delta-nu = 1/(nn*tau)
nu2 = nu-nushift
# Plot:
plt.figure()
plt.plot(nu2/1e3,real(ftwid2),label=r'Re[$\tilde{f}(\nu)$]')
plt.plot(nu2/1e3,imag(ftwid2),label=r'Im[$\tilde{f}(\nu)$]')
plt.legend()
plt.xlabel(r'$\nu$ (kHz)')
plt.show()
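numpy also provides helpers that do this bookkeeping for us. A brief sketch (reusing the same sampling parameters as hypothetical inputs): `fftfreq` builds the frequency axis, with the negative frequencies in the second half, and `fftshift` rolls zero frequency to the centre, much like the manual `roll` above.

```python
import numpy as np

# numpy's own helpers for the frequency axis: fftfreq builds the frequencies
# (negative ones in the second half) and fftshift centres zero frequency.
nn, tau = 200, 1e-6
t = np.arange(nn)*tau
sig = np.cos(2*np.pi*200e3*t)                        # a 200 kHz test tone
spec = np.fft.fftshift(np.fft.fft(sig))
freqs = np.fft.fftshift(np.fft.fftfreq(nn, d=tau))   # Hz, ordered low to high
peak = freqs[np.argmax(abs(spec))]
print(abs(peak)/1e3, "kHz")                          # peaks sit at +/- 200 kHz
```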
Make a comparison of the speed of our simple implementation of the FT used to look at the sound file `pitch.txt` with the numpy implementation of an FFT. Make a plot of the relative speed of the two algorithms with respect to sample size for any function you choose.
In the image example above we used rfft from numpy and coded a DCT in one and two dimensions on top of it. In fact, numpy already has 2D functions in the fft package, and direct DCT functions are available in scipy in 1D. Repeat the image compression analysis we performed on an image of your own choice and compare the speed differences depending on what packages you use - feel free to try anything you can find...
We saw that a common use of discrete Fourier and cosine transforms is to find out what frequency components are present in a signal - known as power spectrum estimation. For this purpose one might not care about phase information, so it suffices to use the discrete cosine transform (no complex numbers) and to plot the absolute value of the transform.
For a signal that goes on for a long time but is only sampled for a finite period, the abrupt start and stop of the sample makes the peaks in the frequency spectrum artificially wide, and introduces other artifacts such as wiggles extending far from the peaks. These undesirable artifacts can be greatly reduced by multiplying the original data by a windowing function that goes smoothly to zero at the start and end of the sampling time, before applying the Fourier or cosine transform.
One popular windowing function is the Hanning window, available (along with various other windowing functions) in numpy. Specifically, `numpy.hanning(nn)` returns a Hanning window in an array with `nn` elements, as illustrated here:
import matplotlib.pyplot as plt
from numpy import pi,cos,exp,hanning,linspace
from scipy.fftpack import dct
def ffunc(t):
    """Function defines data to be transformed,
    in this case a cosine oscillation in time and
    exponential decay."""
    return cos(2*pi*freq*t)*exp(-t/tdecay)
freq = 200e3 # oscillation frequency (Hz), here 200 kHz
tdecay = 100e-6 # decay time (s), here 100 microseconds
# Get data to be transformed by sampling function above:
nn = 200 # number of points
tau = 1e-6 # sampling time (s), here 1 microsec
t = linspace(0,(nn-1)*tau,nn) # array of sample times (s)
f = ffunc(t) # array of sampled function points
f2 = hanning(nn)*f # apply Hanning window
plt.figure()
plt.plot(t/1e-6,f,label='f(t)')
plt.plot(t/1e-6,f2,label='f(t) times Hanning window')
plt.legend()
plt.xlabel(r'$t$ ($\mu$s)')
plt.show()
# Compute and plot discrete FT of the data
a = dct(f)
a2 = dct(f2) # do the discrete cosine transforms
nun = 1/(2*tau) # Nyquist frequency (Hz)
numax = ((nn-1)/nn)* nun # max frequency in the DCT (Hz)..
# ..different from DFT by factor of 2
nu = linspace(0,numax,nn) # array of frequencies (Hz)
plt.figure()
plt.plot(nu/1e3,abs(a),label='DCT with no window')
plt.plot(nu/1e3,abs(a2),label='DCT with Hanning window')
plt.legend()
plt.xlabel(r'$\nu$ (kHz)')
plt.show()
A practical example of Fourier analysis of images comes from Atomic Force Microscopy (AFM). Imaging a periodic system, in this case the surface of nickel oxide (NiO), is an obvious setting where Fourier analysis can show which periodicities are really present. In this work (Nature 446 (2007) 522–525), the authors are trying to detect the exchange force: the difference in the force measured in AFM when a magnetic tip interacts with surface atoms of different spin. This can only be seen at close approach, so they use a Fourier transform to show that the image at close approach (b) has extra peaks in its FT (d), due to the magnetic surface atoms, which are absent from the longer-range image (a) and its FT (c).
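The idea behind this kind of analysis can be sketched with a synthetic periodic "surface" (invented for illustration; this is not the NiO data): the peaks of the 2D FFT power spectrum sit at the spatial frequencies of the lattice.

```python
import numpy as np

# synthetic square lattice with 8 periods across the image
x = np.linspace(0, 1, 128, endpoint=False)
X, Y = np.meshgrid(x, x)
surface = np.cos(2*np.pi*8*X) + np.cos(2*np.pi*8*Y)

power = np.abs(np.fft.fft2(surface))**2
row = power[0]                      # spectrum along kx at ky = 0
print("strongest kx peak at:", np.argmax(row[:65]))  # the lattice frequency, 8
```

In a real AFM image, an extra periodicity (such as the magnetic superstructure above) would show up as additional peaks in this power spectrum at new positions in the (kx, ky) plane.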
Physics data come in a large variety of formats, but usually a package already exists to handle whichever one you encounter. In the earlier example we explored the Fourier transform of a sound at a single frequency, but any real data you meet is likely to be much more complex. Here we perform a Fourier analysis on a piece of music.
import warnings
warnings.filterwarnings('ignore') # generally dangerous, but librosa doesn't support mp3 at the moment and uses audioread, so warnings are annoying
from numpy import fft,linspace,sin,pi,place
from scipy.fftpack import dct,idct
import matplotlib.pyplot as plt
# use the Librosa package for handling sound files
import librosa
import librosa.display
import IPython.display as ipd
# first we can just generate a simple tone as a test
sr = 22050 # sample rate
T = 2.0 # seconds
t = linspace(0, T, int(T*sr), endpoint=False) # time variable
x = 0.5*sin(2*pi*440*t) # pure sine wave at 440 Hz
ipd.Audio(x, rate=sr) # so we can play it if we wanted. This works only in notebooks easily, but you might find a clever solution, such as writing an audio file out.
plt.figure(figsize=(16,6)) # set the figsize
plt.subplot(1,2,1)
plt.xlim(0,1000)
plt.plot(x)
plt.subplot(1,2,2)
c = fft.rfft(x)
plt.plot(abs(c)) # a single peak from the 440 Hz tone (here at bin 880: 2 s of data gives 0.5 Hz per bin)
plt.show()
# Let's try it with some real music
audio_path = 'music.mp3'
ipd.Audio(audio_path) # you can decide whether you want to actually play it
x , sr = librosa.load(audio_path) # Load the audio as a waveform `x` and store the sampling rate as `sr`
print("Sampling rate is:",sr,"Hz")
# plot the waveform of the song
plt.figure(figsize=(14, 5))
plt.plot(x)
plt.show()
# Output: Sampling rate is: 22050 Hz
# take the fourier transform of the music file
c_music = dct(x)
plt.figure(figsize=(16,6)) # set the figsize
plt.subplot(1,2,1)
plt.plot(abs(c_music))
# Librosa has a lot of more complex analysis features
X = librosa.stft(x)
Xdb = librosa.amplitude_to_db(abs(X))
plt.subplot(1,2,2)
librosa.display.specshow(Xdb, sr=sr, x_axis='time', y_axis='hz')
plt.show()
# Let's cut some frequencies and see what happens
cutoff = 1e4 # amplitude threshold for the DCT coefficients
place(c_music, abs(c_music) < cutoff, [0]) # zero every coefficient whose amplitude falls below the threshold
plt.figure(figsize=(14,5)) # set the figsize
plt.plot(abs(c_music))
x_filter = idct(c_music) # inverse transform back to the time domain
plt.figure(figsize=(14, 5))
plt.plot(x_filter)
plt.show()
ipd.Audio(x_filter, rate=sr) # some might say it has improved...
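The thresholding above removes quiet components regardless of pitch. To cut a band of frequencies instead, the transform coefficients can be zeroed by frequency; here is a minimal sketch of a low-pass filter on a synthetic two-tone signal (no audio file assumed, and the 1 kHz cutoff is arbitrary):

```python
import numpy as np

sr = 22050                               # sample rate (Hz)
t = np.linspace(0, 1, sr, endpoint=False)
x = np.sin(2*np.pi*440*t) + 0.5*np.sin(2*np.pi*5000*t)  # two pure tones

c = np.fft.rfft(x)
freqs = np.fft.rfftfreq(len(x), d=1/sr)  # frequency of each coefficient (Hz)
c[freqs > 1000] = 0                      # low-pass: discard everything above 1 kHz
x_lp = np.fft.irfft(c, n=len(x))         # back to the time domain; the 5 kHz tone is gone
```

Applied to the music waveform x loaded above (with its own sr), the same four lines would remove all content above the chosen cutoff.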