In [1]:

%pylab inline

Welcome to pylab, a matplotlib-based Python environment [backend: module://IPython.zmq.pylab.backend_inline].
For more information, type 'help(pylab)'.

Interpolation¶

In [2]:

from scipy import interpolate

In [3]:

def f(x):
    return np.sin(x) - 0.3 * x

In [4]:

n_m = 10
x_m = arange(n_m)
y_m = f(x_m) + 0.15*randn(n_m) # simulated measured signal

In [5]:

x_real = linspace(0, n_m-1, 100)
y_real = f(x_real)

lin_interp = interpolate.interp1d(x_m, y_m)  # return linear interpolation function
y_est_lin = lin_interp(x_real)   # evaluate at desired points

cub_interp = interpolate.interp1d(x_m, y_m, kind='cubic')  # return cubic interpolation function
y_est_cub = cub_interp(x_real)

In [6]:

fig, ax = subplots(figsize=(10,5))

ax.plot(x_real, y_real, 'k:', label='actual')
ax.plot(x_m, y_m, 'bo', label='measured')
ax.plot(x_real, y_est_lin, 'g-', label='linear')
ax.plot(x_real, y_est_cub, 'r-', label='cubic')
legend(loc='lower left')

Out[6]:

<matplotlib.legend.Legend at 0x106ec5290>

Statistics¶

scipy.stats is the core statistics library (distribution functions and common statisitical testing functions).

For modelling and more advanced statistical data exploration see Statsmodels

In [7]:

from scipy import stats

In [8]:

x = linspace(-5, 5, 100)
P = stats.norm()     # normal distribution

In [9]:

fig, ax = subplots(2,1, sharex=True)
ax[0].plot(x, P.pdf(x))
ax[0].set_title('probability density function')
ax[1].plot(x, P.cdf(x))
ax[1].set_title('cumulative density function')

Out[9]:

<matplotlib.text.Text at 0x107879190>

In [10]:

s_sample = P.rvs(size=1000)
r_sample = randn(500)
h = hist(s_sample, bins=50)
h1 = hist(r_sample, bins=50, color='red', alpha=0.6)

t-test¶

In [11]:

t_stat, p_value = stats.ttest_ind(s_sample, r_sample)
print 't_stat:', t_stat
print 'p_value:', p_value

t_stat: 0.273084133256
p_value: 0.784826184878

Least-squares fit¶

In [12]:

from scipy import stats

In [13]:

np = 50
x = linspace(-10, 20, np)

a0, b0 = 0.75, -3

y = a0 * x + b0
y_noise = y + randn(np)*2

In [14]:

resu = stats.linregress(x, y_noise)
a, b = resu[0:2]

y_fit = a*x + b

eq_lbl = '$y = %7.2f x %+7.2f$' % (a,b)

plot(x, y_noise, 'ko')
plot(x, y_fit, 'b-', label=eq_lbl)
legend(loc='upper left')

Out[14]:

<matplotlib.legend.Legend at 0x107c11f50>

In [15]:

# same task using polynomial fit
a, b = polyfit(x, y_noise, 1)
y_fit = polyval((a,b), x)

eq_lbl = '$y = %7.2f x %+7.2f$' % (a,b)

plot(x, y_noise, 'ko')
plot(x, y_fit,'b-', label=eq_lbl)
legend(loc='upper left')

Out[15]:

<matplotlib.legend.Legend at 0x107fe1d50>

In [16]:

a0, b0, c0 = 0.5, -1.4, 8.0
y = a0*x**2 + b0*x + c0
y_noise = y + randn(np)*10
plot(x, y_noise, 'ko', mfc='none')  # mfc <-> markerfacecolor

a, b, c = polyfit(x, y_noise, 2)
eq_lbl = r'$%.2f x^2 %+.2f x %+.2f$' % (a, b, c)
y_fit = polyval((a,b,c), x)
plot(x, y_fit, 'b-', label=eq_lbl, lw=2)
legend(loc='upper left')

Out[16]:

<matplotlib.legend.Legend at 0x107fd8690>

Smoothing¶

In [29]:

import numpy as np

In [30]:

x = linspace(-1, 1, 100)

pure = sin(15*x)
corrupt = pure +  0.25*randn(100)

In [37]:

# moving average
wgt = np.ones(5)
smooth = numpy.convolve(wgt/wgt.sum(), corrupt, mode='same')

In [57]:

fig, ax = subplots(figsize=(10,4))
ax.plot(x, pure, 'k-', label='original')
ax.plot(x, corrupt, label='corrupted')
ax.plot(x, smooth, 'r-', label='smoothed')
ax.set_ylim([-2,3])
legend()

Out[57]:

<matplotlib.legend.Legend at 0x109daa0d0>

window functions¶

In [62]:

length = 25
figure(figsize=(8,8))
subplot(221)
plot(np.hanning(length))
title('Hanning')
subplot(222)
plot(np.hamming(length))
title('Hamming')
subplot(223)
plot(np.bartlett(length))
title('Bartlett')
subplot(224)
plot(np.blackman(length))
title('Blackman')

Out[62]:

<matplotlib.text.Text at 0x10bd989d0>