Try out astropy.models¶

Let's see what's possible with astropy.models ... we are trying this:

Chi^2 fit to a line model
Chi^2 fit to a Gauss model
Poisson likelihood (Cash statistic) fit to a Gauss model

With astropy we also want to make it work with user-defined models and user-defined fit statistics.

See: https://github.com/astropy/astropy/pull/493/

In [1]:

import numpy as np

In [2]:

from astropy.models import models, fitting, parameters

In [3]:

# We use iminuit to check the results
# http://iminuit.github.io/iminuit/
# iminuit is super light-weight, all you get is a class called Minuit,
# which can compute best-fit parameters (migrad), parameter errors
# (hesse and minos) and a few other things (e.g. fit statistic 
# profiles / contours).
# You have to write your models and fit statistics yourself.
from iminuit import Minuit

In [4]:

%pylab inline

Welcome to pylab, a matplotlib-based Python environment [backend: module://IPython.kernel.zmq.pylab.backend_inline].
For more information, type 'help(pylab)'.

Chi^2 fit with linear model¶

In [5]:

# Data
# Let's use the example from here:
# http://nbviewer.ipython.org/5030045
xdata = np.array([0, 1, 2, 3, 4, 5])
ydata = np.array([1, 1, 5, 7, 8, 12])
sigma = np.array([1, 2, 1, 2, 1, 2], dtype=float)

In [6]:

# Plot the data
plt.plot(xdata, ydata, 'o', label='true model')
plt.xlim(-0.5, 5.5)
plt.ylim(0, 13);

In [7]:

# Model
def line(x, slope, intercept):
    """Linear function (two fit parameters)"""
    return slope * x + intercept

In [8]:

# Fit statistic (not used at the moment)
def chi2(model, parameters, data):
    """Generic chi^2 function"""
    slope, intercept = parameters
    x, y, sigma = data
    chi = (y - model(*parameters)) / sigma
    chi2 = chi ** 2
    return np.sum(chi2)

iminuit¶

In [9]:

def chi2_for_line(slope, intercept):
    """
    Chi^2 statistic for given line model parameters.
    Note: The Minuit fitter is not interested in your data or model,
    only this function!
    """
    chi = (ydata - line(xdata, slope, intercept)) / sigma
    chi2 = chi ** 2
    return np.sum(chi2)

In [10]:

minuit = Minuit(chi2_for_line, pedantic=False, print_level=0)
minuit.migrad() # Compute optimum values
minuit.hesse() # Compute errors (covariance matrix as inverse Hesse matrix)
print 'values:', minuit.values
print 'errors:', minuit.errors

values: {'slope': 1.952830188677304, 'intercept': 0.7704402515790711}
errors: {'slope': 0.3071475582636637, 'intercept': 0.8504530789683833}

astropy¶

In [11]:

# Compute parameters and errors with astropy.models
poly_model = models.Poly1DModel(1)
fitter = fitting.LinearLSQFitter(poly_model)
fitter(xdata, ydata, weights=sigma ** (-1))
print dict(slope=poly_model.c1, intercept=poly_model.c0)

# TODO: Currently no way to compute parameter errors with astropy.models.

{'slope': [1.9528301886792441], 'intercept': [0.77044025157232865]}

In [12]:

class UserLineModel(models.PModel):
    """
    Line as a user-defined model in astropy

    Note: this is a lot of boilerplate code.
    But in reality there is no reason for a user
    to not use the built-in polynomial models,
    so it doesn't matter if this is not easy in astropy.
    """
    parnames = ['slope', 'intercept']

    def __init__(self, slope, intercept, paramdim=1):
        self.linear = True 
        self._slope = parameters._Parameter(name='slope', val=slope, mclass=self, paramdim=paramdim)
        self._intercept = parameters._Parameter(name='intercept', val=intercept, mclass=self, paramdim=paramdim)
        models.ParametricModel.__init__(self, self.parnames, ndim=1, outdim=1, paramdim=paramdim)
        self.domain = None
        self.window = None
        self._order = 2

    def eval(self, x, params):
        return params[0] * x + params[1]

    def __call__(self, x):
        x, format = models._convert_input(x, self.paramdim)
        result = self.eval(x, self.psets)
        return models._convert_output(result, format)
    
    def deriv(self, x):
        res = np.ones((len(x), 2))
        res[:,0] = x.copy()
        return res

In [13]:

# Run the example using the user-defined model
line_model = UserLineModel(slope=1, intercept=1)
fitter = fitting.LinearLSQFitter(line_model)
fitter(xdata, ydata, weights=sigma ** (-1))
print dict(slope=line_model.slope, intercept=line_model.intercept)
# TODO: Results don't match. Why!???

{'slope': [4.8820754716981112], 'intercept': [5.6525157232704402]}

In [14]:

# Trying to find out why results don't match ...
poly_model.__dict__
line_model.__dict__

Out[14]:

{'_intercept': [5.6525157232704402],
 '_ndim': 1,
 '_order': 2,
 '_outdim': 1,
 '_paramdim': 1,
 '_parameters': [4.8820754716981112, 5.6525157232704402],
 '_parcheck': {},
 '_parnames': ['slope', 'intercept'],
 '_slope': [4.8820754716981112],
 'constraints': <Constraints(UserLineModel, fixed={'slope': False, 'intercept': False}, tied={'slope': False, 'intercept': False}, bounds={'slope': (-1000000000000.0, 1000000000000.0), 'intercept': (-1000000000000.0, 1000000000000.0)}, )>,
 'domain': [0.0, 5.0],
 'fittable': True,
 'has_inverse': False,
 'linear': True,
 'window': [-1, 1]}

In [15]:

MAXITER = 100
EPS = 1e-10

class UserSLSQPFitter(fitting.Fitter):
    """
    User-defined chi^2 fitter in astropy

    Note: this is a lot of boilerplate code.
    """
    def __init__(self, model, fixed=None, tied=None, bounds=None,
                 eqcons=None, ineqcons=None):
        fitting.Fitter.__init__(self, model, fixed=fixed, tied=tied, bounds=bounds,
                                eqcons=eqcons, ineqcons=ineqcons)

    def errorfunc(self, fps, *args):
        meas = args[0]
        self.fitpars = fps
        res = self.model(*args[1:]) - meas
        return np.sum(res**2)

    def __call__(self, x, y , maxiter=MAXITER, epsilon=EPS):
        self.fitpars = optimize.fmin_slsqp(self.errorfunc, p0=self.model.parameters[:], args=(y, x),
        bounds=self.constraints._bounds, eqcons=self.constraints.eqcons,
        ieqcons=self.constraints.ineqcons)

In [16]:

# Run an example with the user-defined chi^2 fitter
# TODO: Make this work
model = models.Poly1DModel(1)
fitter = UserSLSQPFitter(model)

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input-16-dee76446ad32> in <module>()
      2 # TODO: Make this work
      3 model = models.Poly1DModel(1)
----> 4 fitter = UserSLSQPFitter(model)

<ipython-input-15-0019d59ba150> in __init__(self, model, fixed, tied, bounds, eqcons, ineqcons)
     11                  eqcons=None, ineqcons=None):
     12         fitting.Fitter.__init__(self, model, fixed=fixed, tied=tied, bounds=bounds,
---> 13                                 eqcons=eqcons, ineqcons=ineqcons)
     14 
     15     def errorfunc(self, fps, *args):

TypeError: __init__() got an unexpected keyword argument 'ineqcons'

ERROR: TypeError: __init__() got an unexpected keyword argument 'ineqcons' [IPython.core.interactiveshell]

In [17]:

# TODO: Run an example with the user-defined model and chi^2 fitter!

Chi^2 fit with non-linear model¶

In [18]:

# Model
def gauss(x, amplitude, mean, sigma):
    exponent = 0.5 * ((x - mean) / sigma) ** 2
    return amplitude * np.exp(-exponent)

In [19]:

# Data (simulated)
true_parameter_values=dict(amplitude=100, mean=5, sigma=1)
xdata = np.arange(0, 10, 0.1)
ydata_model = gauss(xdata, **true_parameter_values)
sigma = 10 * np.ones_like(xdata)
np.random.seed(0)
yerror = np.random.normal(0, sigma)
ydata = ydata_model + yerror

In [20]:

# Plot the data
plt.plot(xdata, ydata_model, lw=2, label='true model')
plt.plot(xdata, ydata, 'o', label='simulated data')
plt.legend();

iminuit¶

In [21]:

def chi2_for_gauss(amplitude, mean, sigma):
    """
    Chi^2 statistic for given gauss model parameters.
    """
    chi = (ydata - gauss(xdata, amplitude, mean, sigma)) / sigma
    chi2 = chi ** 2
    return np.sum(chi2)

In [22]:

minuit = Minuit(chi2_for_gauss, pedantic=False, print_level=0, **true_parameter_values)
minuit.migrad() # Compute optimum values
minuit.hesse() # Compute errors (covariance matrix as inverse Hesse matrix)
print 'values:', minuit.values
print 'errors:', minuit.errors

values: {'sigma': 1.150941192787898, 'amplitude': 88.27709771027597, 'mean': 4.975913660938593}
errors: {'sigma': 0.006012284171309272, 'amplitude': 0.3668916344659762, 'mean': 0.004395120842489413}

astropy¶

In [23]:

# Compute parameters and errors with astropy.models
gauss_model = models.Gauss1DModel(amplitude=true_parameter_values['amplitude'],
                                  xcen=true_parameter_values['mean'],
                                  xsigma=true_parameter_values['sigma'])
fitter = fitting.NonLinearLSQFitter(gauss_model)
fitter(xdata, ydata, weights=sigma ** (-1))
print dict(amplitude=gauss_model.amplitude,
           mean=gauss_model.xcen,
           sigma=gauss_model.xsigma)

# TODO: Results don't match the iminuit results from the last cell. Why?

{'sigma': [1.1162046730289203], 'amplitude': [111.43912515310208], 'mean': [5.0483590613996361]}

In [24]:

# TODO: User-defined Gauss1D model

In [25]:

# TODO: User-defined NonLinearLSQFitter

Poisson likelihood fit¶

Let's see if we can do a Poisson likelihood fit (Cash statistic) with astropy.models

In [26]:

# Model
def gauss(x, amplitude, mean, sigma):
    exponent = 0.5 * ((x - mean) / sigma) ** 2
    return amplitude * np.exp(-exponent)

In [27]:

# Data (simulated)
true_parameter_values=dict(amplitude=100, mean=5, sigma=1)
xdata = np.arange(0, 10, 0.1)
ydata_model = gauss(x, **true_parameter_values)
np.random.seed(0)
ydata = np.random.poisson(ydata_model)

---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
<ipython-input-27-d7904c03740e> in <module>()
      2 true_parameter_values=dict(amplitude=100, mean=5, sigma=1)
      3 xdata = np.arange(0, 10, 0.1)
----> 4 ydata_model = gauss(x, **true_parameter_values)
      5 np.random.seed(0)
      6 ydata = np.random.poisson(ydata_model)

NameError: name 'x' is not defined

ERROR: NameError: name 'x' is not defined [IPython.core.interactiveshell]

In [28]:

# Plot the data
plt.plot(xdata, ydata_model, lw=2, label='true model')
plt.plot(xdata, ydata, 'o', label='simulated data')
plt.legend();

In [29]:

# Fit statistic
def cash(D, M, safe=False):
    """cash fit statistic where D = data, M = model
    http://cxc.cfa.harvard.edu/sherpa/statistics/#cash

    This is simply 2 x the negative log Poisson likelihood:
    P = (M ** D) * exp(-M) / (D!)
    log(P) = D * log(M) - M - log(D!)
    cash = - 2 * log(P) (model-independent term dropped)
    """
    stat = 2 * (M - D * log(M))
    if safe:
        return np.where(M > 0, stat, 1)
    else:
        return stat

iminuit¶

In [30]:

def cash_for_gauss(amplitude, mean, sigma):
    """
    Cash statistic for given gauss model parameters.
    Note: The Minuit fitter is not interested in your data or model,
    only this function!
    """
    ydata_model = gauss(xdata, amplitude, mean, sigma)
    statval = cash(ydata, ydata_model)
    return np.sum(statval)

# TODO: check if an up=0.5 is missing to get correct errors!
minuit = Minuit(cash_for_gauss, pedantic=False, print_level=0, **true_parameter_values)
minuit.migrad() # Compute optimum values
minuit.hesse() # Compute errors (covariance matrix as inverse Hesse matrix)
print 'values:', minuit.values
print 'errors:', minuit.errors

values: {'sigma': 1.531038344360847, 'amplitude': 66.94688433626791, 'mean': 4.900701607119237}
errors: {'sigma': 0.022203455375589296, 'amplitude': 1.6325347278855415, 'mean': 0.030414683127228212}

astropy¶

In [31]:

# TODO: reproduce Minuit results from last cell with astropy

In [32]:

# TODO: User-defined cash fitter
'''
class UserCashFitter(fitting.Fitter):
    """User-defined cash statistic fitter in astropy"""
    def __init__(self, model, fixed=None, tied=None, bounds=None,
                 eqcons=None, ineqcons=None):
        fitting.Fitter.__init__(self, model, fixed=fixed, tied=tied, bounds=bounds,
                                eqcons=eqcons, ineqcons=ineqcons)

    def errorfunc(self, fps, *args):
        meas = args[0]
        self.fitpars = fps
        res = self.model(*args[1:]) - meas
        return np.sum(res**2)

    def __call__(self, x, y , maxiter=MAXITER, epsilon=EPS):
        self.fitpars = optimize.fmin_slsqp(self.errorfunc, p0=self.model.parameters[:], args=(y, x),
        bounds=self.constraints._bounds, eqcons=self.constraints.eqcons,
        ieqcons=self.constraints.ineqcons)
'''

Out[32]:

'\nclass UserCashFitter(fitting.Fitter):\n    """User-defined cash statistic fitter in astropy"""\n    def __init__(self, model, fixed=None, tied=None, bounds=None,\n                 eqcons=None, ineqcons=None):\n        fitting.Fitter.__init__(self, model, fixed=fixed, tied=tied, bounds=bounds,\n                                eqcons=eqcons, ineqcons=ineqcons)\n\n    def errorfunc(self, fps, *args):\n        meas = args[0]\n        self.fitpars = fps\n        res = self.model(*args[1:]) - meas\n        return np.sum(res**2)\n\n    def __call__(self, x, y , maxiter=MAXITER, epsilon=EPS):\n        self.fitpars = optimize.fmin_slsqp(self.errorfunc, p0=self.model.parameters[:], args=(y, x),\n        bounds=self.constraints._bounds, eqcons=self.constraints.eqcons,\n        ieqcons=self.constraints.ineqcons)\n'

Backup cells¶

In [33]:

'''
class OldLine(models.ParametricModel):
    """Old version of the Line class. Doesn't work."""
    parnames = ['slope', 'intercept']
    def __init__(self, slope, intercept, paramdim=1):
        self.linear = True
        self._slope = parameters._Parameter(name='slope', val=slope, mclass=self, paramdim=paramdim)
        self._intercept = parameters._Parameter(name='intercept', val=intercept, mclass=self, paramdim=paramdim)
        models.ParametricModel.__init__(self, self.parnames, ndim=1, outdim=1, paramdim=paramdim)
    def eval(self, x, params):
        return params[0] * x + params[1]
    def __call__(self, x):
        x, format = models._convert_input(x, self.paramdim)
        result = self.eval(x, self.psets)
        return models._convert_output(result, format)
'''

Out[33]:

'\nclass OldLine(models.ParametricModel):\n    """Old version of the Line class. Doesn\'t work."""\n    parnames = [\'slope\', \'intercept\']\n    def __init__(self, slope, intercept, paramdim=1):\n        self.linear = True\n        self._slope = parameters._Parameter(name=\'slope\', val=slope, mclass=self, paramdim=paramdim)\n        self._intercept = parameters._Parameter(name=\'intercept\', val=intercept, mclass=self, paramdim=paramdim)\n        models.ParametricModel.__init__(self, self.parnames, ndim=1, outdim=1, paramdim=paramdim)\n    def eval(self, x, params):\n        return params[0] * x + params[1]\n    def __call__(self, x):\n        x, format = models._convert_input(x, self.paramdim)\n        result = self.eval(x, self.psets)\n        return models._convert_output(result, format)\n'

In [33]:

In [ ]: