pyerrors/pyerrors/fits.py

import gc
from collections.abc import Sequence
import warnings
import numpy as np
import autograd.numpy as anp
import scipy.optimize
import scipy.stats
import matplotlib.pyplot as plt
from matplotlib import gridspec
from scipy.odr import ODR, Model, RealData
import iminuit
from autograd import jacobian as auto_jacobian
from autograd import hessian as auto_hessian
from autograd import elementwise_grad as egrad
from numdifftools import Jacobian as num_jacobian
from numdifftools import Hessian as num_hessian
from .obs import Obs, derived_observable, covariance, cov_Obs


class Fit_result(Sequence):
    """Container for the outcome of a fit.

    Acts as a read-only sequence over the fitted parameters; all further
    information is attached as plain attributes by the fit routines.

    Attributes
    ----------
    fit_parameters : list
        results for the individual fit parameters,
        also accessible via indices.
    chisquare_by_dof : float
        reduced chisquare.
    p_value : float
        p-value of the fit
    t2_p_value : float
        Hotelling t-squared p-value for correlated fits.
    """

    def __init__(self):
        self.fit_parameters = None

    def __getitem__(self, idx):
        return self.fit_parameters[idx]

    def __len__(self):
        return len(self.fit_parameters)

    def gamma_method(self, **kwargs):
        """Apply the gamma method to all fit parameters"""
        for parameter in self.fit_parameters:
            parameter.gamma_method(**kwargs)

    gm = gamma_method

    def __str__(self):
        pieces = ['Goodness of fit:\n']

        # Either the reduced chisquare or (for ODR fits) the residual variance is shown.
        if hasattr(self, 'chisquare_by_dof'):
            pieces.append('\u03C7\u00b2/d.o.f. = ' + format(self.chisquare_by_dof, '2.6f') + '\n')
        elif hasattr(self, 'residual_variance'):
            pieces.append('residual variance = ' + format(self.residual_variance, '2.6f') + '\n')

        # Optional quality measures, printed only when the fit routine attached them.
        optional_rows = (
            ('chisquare_by_expected_chisquare', '\u03C7\u00b2/\u03C7\u00b2exp  = ', '2.6f'),
            ('p_value', 'p-value   = ', '2.4f'),
            ('t2_p_value', 't\u00B2p-value = ', '2.4f'),
        )
        for attribute, label, spec in optional_rows:
            if hasattr(self, attribute):
                pieces.append(label + format(getattr(self, attribute), spec) + '\n')

        pieces.append('Fit parameters:\n')
        for index, par in enumerate(self.fit_parameters):
            # Non-negative values get a leading blank so that they line up with negative ones.
            sign_pad = ' ' * int(par >= 0)
            pieces.append(str(index) + '\t' + sign_pad + str(par).rjust(int(par < 0.0)) + '\n')
        return ''.join(pieces)

    def __repr__(self):
        attributes = self.__dict__
        width = max(len(name) for name in attributes) + 1
        rows = (name.rjust(width) + ': ' + repr(value) for name, value in sorted(attributes.items()))
        return '\n'.join(rows)


def least_squares(x, y, func, priors=None, silent=False, **kwargs):
    r'''Performs a non-linear fit to y = func(x).

    Dispatches to the fit with priors when `priors` is given and to the
    (combined) chisquare fit otherwise.

    Parameters
    ----------
    For an uncombined fit:

    x : list
        list of floats.
    y : list
        list of Obs.
    func : object
        fit function, has to be of the form

        ```python
        import autograd.numpy as anp

        def func(a, x):
            return a[0] + a[1] * x + a[2] * anp.sinh(x)
        ```

        For multiple x values func can be of the form

        ```python
        def func(a, x):
            (x1, x2) = x
            return a[0] * x1 ** 2 + a[1] * x2
        ```
        It is important that all numpy functions refer to autograd.numpy, otherwise the differentiation
        will not work.

    OR For a combined fit:

    x : dict
        dict of lists.
    y : dict
        dict of lists of Obs.
    func : dict
        dict of fit functions sharing the keys of x and y.
        The fit functions have to be of the form (here a[0] is the common fit parameter)

        ```python
        import autograd.numpy as anp

        def func_a(a, x):
            return a[1] * anp.exp(-a[0] * x)

        def func_b(a, x):
            return a[2] * anp.exp(-a[0] * x)

        funcs = {"a": func_a,
                 "b": func_b}
        ```
        It is important that all numpy functions refer to autograd.numpy, otherwise the differentiation
        will not work.

    priors : list, optional
        priors has to be a list with an entry for every parameter in the fit. The entries can either be
        Obs (e.g. results from a previous fit) or strings containing a value and an error formatted like
        0.548(23), 500(40) or 0.5(0.4)
    silent : bool, optional
        If true all output to the console is omitted (default False).
    initial_guess : list
        can provide an initial guess for the input parameters. Relevant for
        non-linear fits with many parameters. In case of correlated fits the guess is used to perform
        an uncorrelated fit which then serves as guess for the correlated fit.
    method : str, optional
        can be used to choose an alternative method for the minimization of chisquare.
        The possible methods are the ones which can be used for scipy.optimize.minimize and
        migrad of iminuit. If no method is specified, Levenberg-Marquardt is used.
        Reliable alternatives are migrad, Powell and Nelder-Mead.
        Fits with priors are always minimized with migrad.
    tol: float, optional
        can be used (for methods other than Levenberg-Marquardt) to set the tolerance for convergence
        to a different value to either speed up convergence at the cost of a larger error on the fitted parameters (and possibly
        invalid estimates for parameter uncertainties) or smaller values to get more accurate parameter values
        The stopping criterion depends on the method, e.g. migrad: edm_max = 0.002 * tol * errordef (EDM criterion: edm < edm_max)
    correlated_fit : bool
        If True, use the full inverse covariance matrix in the definition of the chisquare cost function.
        For details about how the covariance matrix is estimated see `pyerrors.obs.covariance`.
        In practice the correlation matrix is Cholesky decomposed and inverted (instead of the covariance matrix).
        This procedure should be numerically more stable as the correlation matrix is typically better conditioned (Jacobi preconditioning).
        This option has no effect when `priors` are given.
    expected_chisquare : bool
        If True estimates the expected chisquare which is
        corrected by effects caused by correlated input data (default False).
        Only evaluated for uncorrelated fits without priors.
    resplot : bool
        If True, a plot which displays fit, data and residuals is generated (default False).
    qqplot : bool
        If True, a quantile-quantile plot of the fit result is generated (default False).
    num_grad : bool
        Use numerical differentiation instead of automatic differentiation to perform the error propagation (default False).

    Returns
    -------
    output : Fit_result
        Parameters and information on the fitted result.
    '''
    if priors is None:
        return _combined_fit(x, y, func, silent=silent, **kwargs)
    return _prior_fit(x, y, func, priors, silent=silent, **kwargs)


def total_least_squares(x, y, func, silent=False, **kwargs):
    r'''Performs a non-linear fit to y = func(x) taking the errors of both x and y into account.

    Parameters
    ----------
    x : list
        list of Obs, or a tuple of lists of Obs
    y : list
        list of Obs. The dvalues of the Obs are used as x- and yerror for the fit.
    func : object
        func has to be of the form

        ```python
        import autograd.numpy as anp

        def func(a, x):
            return a[0] + a[1] * x + a[2] * anp.sinh(x)
        ```

        For multiple x values func can be of the form

        ```python
        def func(a, x):
            (x1, x2) = x
            return a[0] * x1 ** 2 + a[1] * x2
        ```

        It is important that all numpy functions refer to autograd.numpy, otherwise the differentiation
        will not work.
    silent : bool, optional
        If true all output to the console is omitted (default False).
    initial_guess : list
        can provide an initial guess for the input parameters. Relevant for non-linear
        fits with many parameters.
    expected_chisquare : bool
        If true prints the expected chisquare which is
        corrected by effects caused by correlated input data.
        This can take a while as the full correlation matrix
        has to be calculated (default False).
    covariance : array, optional
        If given together with `expected_chisquare=True`, this matrix is used instead of
        estimating the covariance of the concatenated (y, x) data.
    num_grad : bool
        Use numerical differentiation instead of automatic differentiation to perform the error propagation (default False).

    Notes
    -----
    Based on the orthogonal distance regression module of scipy.

    Returns
    -------
    output : Fit_result
        Parameters and information on the fitted result.

    Raises
    ------
    TypeError
        If func is not callable.
    RuntimeError
        If the number of fit parameters could not be determined.
    Exception
        If x or y errors are missing, the initial guess has the wrong length,
        the minimization did not converge or the hessian cannot be inverted.
    '''

    output = Fit_result()

    output.fit_function = func

    x = np.array(x)

    x_shape = x.shape

    # Select numerical (numdifftools) or automatic (autograd) differentiation.
    if kwargs.get('num_grad') is True:
        jacobian = num_jacobian
        hessian = num_hessian
    else:
        jacobian = auto_jacobian
        hessian = auto_hessian

    if not callable(func):
        raise TypeError('func has to be a function.')

    # Determine the number of fit parameters by probing func with parameter
    # arrays of increasing length until the call no longer fails.
    for i in range(42):
        try:
            func(np.arange(i), x.T[0])
        except TypeError:
            continue
        except IndexError:
            continue
        else:
            break
    else:
        raise RuntimeError("Fit function is not valid.")

    n_parms = i
    if not silent:
        print('Fit with', n_parms, 'parameter' + 's' * (n_parms > 1))

    # Central values and errors of the input data as plain float arrays.
    x_f = np.vectorize(lambda o: o.value)(x)
    dx_f = np.vectorize(lambda o: o.dvalue)(x)
    y_f = np.array([o.value for o in y])
    dy_f = np.array([o.dvalue for o in y])

    if np.any(np.asarray(dx_f) <= 0.0):
        raise Exception('No x errors available, run the gamma method first.')

    if np.any(np.asarray(dy_f) <= 0.0):
        raise Exception('No y errors available, run the gamma method first.')

    if 'initial_guess' in kwargs:
        x0 = kwargs.get('initial_guess')
        if len(x0) != n_parms:
            raise Exception('Initial guess does not have the correct length: %d vs. %d' % (len(x0), n_parms))
    else:
        x0 = [1] * n_parms

    # Run the orthogonal distance regression of scipy.odr.
    data = RealData(x_f, y_f, sx=dx_f, sy=dy_f)
    model = Model(func)
    odr = ODR(data, model, x0, partol=np.finfo(np.float64).eps)
    odr.set_job(fit_type=0, deriv=1)
    out = odr.run()

    output.residual_variance = out.res_var

    output.method = 'ODR'

    output.message = out.stopreason

    output.xplus = out.xplus

    if not silent:
        print('Method: ODR')
        print(*out.stopreason)
        print('Residual variance:', output.residual_variance)

    if out.info > 3:
        raise Exception('The minimization procedure did not converge.')

    # Total number of x values (all components).
    m = x_f.size

    def odr_chisquare(p):
        # p holds the n_parms fit parameters followed by the flattened fitted x values.
        model = func(p[:n_parms], p[n_parms:].reshape(x_shape))
        chisq = anp.sum(((y_f - model) / dy_f) ** 2) + anp.sum(((x_f - p[n_parms:].reshape(x_shape)) / dx_f) ** 2)
        return chisq

    if kwargs.get('expected_chisquare') is True:
        W = np.diag(1 / np.asarray(np.concatenate((dy_f.ravel(), dx_f.ravel()))))

        if kwargs.get('covariance') is not None:
            cov = kwargs.get('covariance')
        else:
            cov = covariance(np.concatenate((y, x.ravel())))

        number_of_x_parameters = int(m / x_f.shape[-1])

        # Assemble the jacobian of the model with respect to the fit parameters
        # and the fitted x values into one block matrix.
        old_jac = jacobian(func)(out.beta, out.xplus)
        fused_row1 = np.concatenate((old_jac, np.concatenate((number_of_x_parameters * [np.zeros(old_jac.shape)]), axis=0)))
        fused_row2 = np.concatenate((jacobian(lambda x, y: func(y, x))(out.xplus, out.beta).reshape(x_f.shape[-1], x_f.shape[-1] * number_of_x_parameters), np.identity(number_of_x_parameters * old_jac.shape[0])))
        new_jac = np.concatenate((fused_row1, fused_row2), axis=1)

        A = W @ new_jac
        P_phi = A @ np.linalg.pinv(A.T @ A) @ A.T
        expected_chisquare = np.trace((np.identity(P_phi.shape[0]) - P_phi) @ W @ cov @ W)
        if expected_chisquare <= 0.0:
            warnings.warn("Negative expected_chisquare.", RuntimeWarning)
            expected_chisquare = np.abs(expected_chisquare)
        output.chisquare_by_expected_chisquare = odr_chisquare(np.concatenate((out.beta, out.xplus.ravel()))) / expected_chisquare
        if not silent:
            print('chisquare/expected_chisquare:',
                  output.chisquare_by_expected_chisquare)

    fitp = out.beta
    # Hessian of chisquare with respect to the fit parameters and the fitted x values.
    try:
        hess = hessian(odr_chisquare)(np.concatenate((fitp, out.xplus.ravel())))
    except TypeError:
        raise Exception("It is required to use autograd.numpy instead of numpy within fit functions, see the documentation for details.") from None

    def odr_chisquare_compact_x(d):
        # Same chisquare as above, but with the measured x values appended to the
        # argument vector so that mixed second derivatives can be taken.
        model = func(d[:n_parms], d[n_parms:n_parms + m].reshape(x_shape))
        chisq = anp.sum(((y_f - model) / dy_f) ** 2) + anp.sum(((d[n_parms + m:].reshape(x_shape) - d[n_parms:n_parms + m].reshape(x_shape)) / dx_f) ** 2)
        return chisq

    jac_jac_x = hessian(odr_chisquare_compact_x)(np.concatenate((fitp, out.xplus.ravel(), x_f.ravel())))

    # Compute hess^{-1} @ jac_jac_x[:n_parms + m, n_parms + m:] using LAPACK dgesv
    try:
        deriv_x = -scipy.linalg.solve(hess, jac_jac_x[:n_parms + m, n_parms + m:])
    except np.linalg.LinAlgError:
        raise Exception("Cannot invert hessian matrix.")

    def odr_chisquare_compact_y(d):
        # Same chisquare as above, but with the measured y values appended to the
        # argument vector so that mixed second derivatives can be taken.
        model = func(d[:n_parms], d[n_parms:n_parms + m].reshape(x_shape))
        chisq = anp.sum(((d[n_parms + m:] - model) / dy_f) ** 2) + anp.sum(((x_f - d[n_parms:n_parms + m].reshape(x_shape)) / dx_f) ** 2)
        return chisq

    jac_jac_y = hessian(odr_chisquare_compact_y)(np.concatenate((fitp, out.xplus.ravel(), y_f)))

    # Compute hess^{-1} @ jac_jac_y[:n_parms + m, n_parms + m:] using LAPACK dgesv
    try:
        deriv_y = -scipy.linalg.solve(hess, jac_jac_y[:n_parms + m, n_parms + m:])
    except np.linalg.LinAlgError:
        raise Exception("Cannot invert hessian matrix.")

    # Build one Obs per fit parameter; the gradients with respect to the input
    # data are supplied manually via man_grad.
    # NOTE(review): the prefactor in the lambda appears to evaluate to one at the
    # central values, so that the value is out.beta[i] - confirm against derived_observable.
    result = []
    for i in range(n_parms):
        result.append(derived_observable(lambda my_var, **kwargs: (my_var[0] + np.finfo(np.float64).eps) / (x.ravel()[0].value + np.finfo(np.float64).eps) * out.beta[i], list(x.ravel()) + list(y), man_grad=list(deriv_x[i]) + list(deriv_y[i])))

    output.fit_parameters = result

    output.odr_chisquare = odr_chisquare(np.concatenate((out.beta, out.xplus.ravel())))
    output.dof = x.shape[-1] - n_parms
    output.p_value = 1 - scipy.stats.chi2.cdf(output.odr_chisquare, output.dof)

    return output


def _prior_fit(x, y, func, priors, silent=False, **kwargs):
    """Performs a chisquare fit of func to y in which every parameter is constrained by a prior.

    The minimized function is the sum of the squared, error-normalized deviations
    of the data from the model and of the parameters from their priors.
    The minimization is carried out with migrad of iminuit.

    Parameters
    ----------
    x : list
        x values, converted to a numpy array.
    y : list
        list of Obs, their dvalues are used as errors.
    func : object
        fit function of the form func(a, x).
    priors : list
        one entry per fit parameter, either Obs or strings of the form
        0.548(23), 500(40) or 0.5(0.4).
    silent : bool, optional
        If true the status output to the console is omitted (default False).
    initial_guess : list
        starting values for the minimization, defaults to the prior values.
    tol : float, optional
        tolerance passed to the minimizer (default 1e-4).
    num_grad : bool
        Use numerical instead of automatic differentiation for the hessian (default False).
    resplot : bool
        If True, a residual plot is generated.
    qqplot : bool
        If True, a quantile-quantile plot is generated.

    Returns
    -------
    output : Fit_result
        Parameters and information on the fitted result.

    Raises
    ------
    TypeError
        If func is not callable.
    RuntimeError
        If the number of fit parameters could not be determined.
    Exception
        If priors or initial guess have the wrong length, errors are missing
        or the minimization did not converge.
    """
    output = Fit_result()

    output.fit_function = func

    x = np.asarray(x)

    if kwargs.get('num_grad') is True:
        hessian = num_hessian
    else:
        hessian = auto_hessian

    if not callable(func):
        raise TypeError('func has to be a function.')

    # Determine the number of fit parameters by probing func with parameter
    # arrays of increasing length until the call no longer fails.
    for i in range(100):
        try:
            func(np.arange(i), 0)
        except TypeError:
            continue
        except IndexError:
            continue
        else:
            break
    else:
        raise RuntimeError("Fit function is not valid.")

    n_parms = i

    if n_parms != len(priors):
        raise Exception('Priors does not have the correct length.')

    def extract_val_and_dval(string):
        """Splits a string of the form value(error) into two floats.

        If the value contains a decimal point and the error does not, the error
        is interpreted in units of the last digit of the value.
        """
        split_string = string.split('(')
        if '.' in split_string[0] and '.' not in split_string[1][:-1]:
            factor = 10 ** -len(split_string[0].partition('.')[2])
        else:
            factor = 1
        return float(split_string[0]), float(split_string[1][:-1]) * factor

    # Convert string priors into Obs; each gets a name with a random suffix.
    loc_priors = []
    for i_n, i_prior in enumerate(priors):
        if isinstance(i_prior, Obs):
            loc_priors.append(i_prior)
        else:
            loc_val, loc_dval = extract_val_and_dval(i_prior)
            loc_priors.append(cov_Obs(loc_val, loc_dval ** 2, '#prior' + str(i_n) + f"_{np.random.randint(2147483647):010d}"))

    output.priors = loc_priors

    if not silent:
        print('Fit with', n_parms, 'parameter' + 's' * (n_parms > 1))

    y_f = [o.value for o in y]
    dy_f = [o.dvalue for o in y]

    if np.any(np.asarray(dy_f) <= 0.0):
        raise Exception('No y errors available, run the gamma method first.')

    p_f = [o.value for o in loc_priors]
    dp_f = [o.dvalue for o in loc_priors]

    if np.any(np.asarray(dp_f) <= 0.0):
        raise Exception('No prior errors available, run the gamma method first.')

    if 'initial_guess' in kwargs:
        x0 = kwargs.get('initial_guess')
        if len(x0) != n_parms:
            raise Exception('Initial guess does not have the correct length.')
    else:
        x0 = p_f

    def chisqfunc(p):
        # Data term plus prior term.
        model = func(p, x)
        chisq = anp.sum(((y_f - model) / dy_f) ** 2) + anp.sum(((p_f - p) / dp_f) ** 2)
        return chisq

    if not silent:
        print('Method: migrad')

    m = iminuit.Minuit(chisqfunc, x0)
    m.errordef = 1
    m.print_level = 0
    if 'tol' in kwargs:
        m.tol = kwargs.get('tol')
    else:
        m.tol = 1e-4
    m.migrad()
    params = np.asarray(m.values)

    # The minimum of chisquare is normalized by the number of data points.
    output.chisquare_by_dof = m.fval / len(x)

    output.method = 'migrad'

    if not silent:
        print('chisquare/d.o.f.:', output.chisquare_by_dof)

    if not m.fmin.is_valid:
        raise Exception('The minimization procedure did not converge.')

    hess = hessian(chisqfunc)(params)
    hess_inv = np.linalg.pinv(hess)

    def chisqfunc_compact(d):
        # Same chisquare, but with the y values and prior values appended to the
        # argument vector so that mixed second derivatives can be taken.
        model = func(d[:n_parms], x)
        chisq = anp.sum(((d[n_parms: n_parms + len(x)] - model) / dy_f) ** 2) + anp.sum(((d[n_parms + len(x):] - d[:n_parms]) / dp_f) ** 2)
        return chisq

    jac_jac = hessian(chisqfunc_compact)(np.concatenate((params, y_f, p_f)))

    # Derivatives of the fit parameters with respect to the data and the priors.
    deriv = -hess_inv @ jac_jac[:n_parms, n_parms:]

    # Build one Obs per fit parameter; the gradients are supplied manually via man_grad.
    result = []
    for i in range(n_parms):
        result.append(derived_observable(lambda x, **kwargs: (x[0] + np.finfo(np.float64).eps) / (y[0].value + np.finfo(np.float64).eps) * params[i], list(y) + list(loc_priors), man_grad=list(deriv[i])))

    output.fit_parameters = result
    output.chisquare = chisqfunc(np.asarray(params))

    if kwargs.get('resplot') is True:
        residual_plot(x, y, func, result)

    if kwargs.get('qqplot') is True:
        qqplot(x, y, func, result)

    return output


def _combined_fit(x, y, func, silent=False, **kwargs):
    """Performs a chisquare fit without priors, optionally combined and/or correlated.

    Parameters
    ----------
    x : list or dict
        x values, or a dict of x values for a combined fit.
    y : list or dict
        list of Obs, or a dict of lists of Obs for a combined fit.
    func : object or dict
        fit function of the form func(a, x), or a dict of such functions.
        For a combined fit x, y and func have to be dicts with identical keys.
    silent : bool, optional
        If true the status output to the console is omitted (default False).
    initial_guess : list
        starting values for the minimization (default 0.1 for every parameter).
    method : str, optional
        'migrad' or a method of scipy.optimize.minimize; Levenberg-Marquardt if omitted.
    tol : float, optional
        tolerance for methods other than Levenberg-Marquardt
        (default 1e-4 for migrad, 1e-12 otherwise).
    correlated_fit : bool
        If True the Cholesky decomposed correlation matrix enters the chisquare.
        The result of an uncorrelated fit is used as starting point.
    expected_chisquare : bool
        If True the expected chisquare is estimated (uncorrelated fits only).
    num_grad : bool
        Use numerical instead of automatic differentiation (default False).
    resplot : bool
        If True, a residual plot is generated for every key.
    qqplot : bool
        If True, a quantile-quantile plot is generated for every key.

    Returns
    -------
    output : Fit_result
        Parameters and information on the fitted result. `chisquare` and `dof`
        are always set; `p_value` and, for correlated fits, `t2_p_value` are
        only set for a positive number of degrees of freedom.

    Raises
    ------
    TypeError
        If only some of x, y, func are dicts or a fit function is not callable.
    RuntimeError
        If the number of fit parameters could not be determined.
    Exception
        If the input is inconsistent, errors are missing, the correlation matrix
        is too ill-conditioned, the minimization did not converge or the hessian
        cannot be inverted.
    """

    output = Fit_result()

    dict_args = [isinstance(arg, dict) for arg in (x, y, func)]
    if all(dict_args):
        xd = x
        yd = y
        funcd = func
        output.fit_function = func
    elif any(dict_args):
        raise TypeError("All arguments have to be dictionaries in order to perform a combined fit.")
    else:
        # A single fit is treated as a combined fit with one (empty) key.
        x = np.asarray(x)
        xd = {"": x}
        yd = {"": y}
        funcd = {"": func}
        output.fit_function = func

    if kwargs.get('num_grad') is True:
        jacobian = num_jacobian
        hessian = num_hessian
    else:
        jacobian = auto_jacobian
        hessian = auto_hessian

    key_ls = sorted(xd)

    if sorted(yd) != key_ls:
        raise Exception('x and y dictionaries do not contain the same keys.')

    if sorted(funcd) != key_ls:
        raise Exception('x and func dictionaries do not contain the same keys.')

    x_all = np.concatenate([np.array(xd[key]) for key in key_ls])
    y_all = np.concatenate([np.array(yd[key]) for key in key_ls])

    y_f = [o.value for o in y_all]
    dy_f = [o.dvalue for o in y_all]

    if len(x_all.shape) > 2:
        raise Exception('Unknown format for x values')

    if np.any(np.asarray(dy_f) <= 0.0):
        raise Exception('No y errors available, run the gamma method first.')

    # number of fit parameters: probe every fit function with parameter arrays
    # of increasing length until the call no longer fails and take the maximum.
    n_parms_ls = []
    for key in key_ls:
        if not callable(funcd[key]):
            raise TypeError('func (key=' + key + ') is not a function.')
        if np.asarray(xd[key]).shape[-1] != len(yd[key]):
            raise Exception('x and y input (key=' + key + ') do not have the same length')
        for i in range(100):
            try:
                funcd[key](np.arange(i), x_all.T[0])
            except TypeError:
                continue
            except IndexError:
                continue
            else:
                break
        else:
            raise RuntimeError("Fit function (key=" + key + ") is not valid.")
        n_parms = i
        n_parms_ls.append(n_parms)
    n_parms = max(n_parms_ls)
    if not silent:
        print('Fit with', n_parms, 'parameter' + 's' * (n_parms > 1))

    if 'initial_guess' in kwargs:
        x0 = kwargs.get('initial_guess')
        if len(x0) != n_parms:
            raise Exception('Initial guess does not have the correct length: %d vs. %d' % (len(x0), n_parms))
    else:
        x0 = [0.1] * n_parms

    def general_chisqfunc_uncorr(p, ivars):
        # Vector of error-normalized residuals for all keys.
        model = anp.concatenate([anp.array(funcd[key](p, anp.asarray(xd[key]))).reshape(-1) for key in key_ls])
        return ((ivars - model) / dy_f)

    def chisqfunc_uncorr(p):
        return anp.sum(general_chisqfunc_uncorr(p, y_f) ** 2)

    if kwargs.get('correlated_fit') is True:
        corr = covariance(y_all, correlation=True, **kwargs)
        covdiag = np.diag(1 / np.asarray(dy_f))
        condn = np.linalg.cond(corr)
        if condn > 0.1 / np.finfo(float).eps:
            raise Exception(f"Cannot invert correlation matrix as its condition number exceeds machine precision ({condn:1.2e})")
        if condn > 1e13:
            warnings.warn(f"Correlation matrix may be ill-conditioned, condition number: {condn:1.2e}", RuntimeWarning)
        chol = np.linalg.cholesky(corr)
        chol_inv = scipy.linalg.solve_triangular(chol, covdiag, lower=True)

        def general_chisqfunc(p, ivars):
            model = anp.concatenate([anp.array(funcd[key](p, anp.asarray(xd[key]))).reshape(-1) for key in key_ls])
            return anp.dot(chol_inv, (ivars - model))

        def chisqfunc(p):
            return anp.sum(general_chisqfunc(p, y_f) ** 2)
    else:
        general_chisqfunc = general_chisqfunc_uncorr
        chisqfunc = chisqfunc_uncorr

    output.method = kwargs.get('method', 'Levenberg-Marquardt')
    if not silent:
        print('Method:', output.method)

    # In all branches an uncorrelated fit is performed first; for correlated fits
    # its result serves as starting point of the correlated minimization.
    if output.method != 'Levenberg-Marquardt':
        if output.method == 'migrad':
            tolerance = 1e-4  # default value of 1e-1 set by iminuit can be problematic
            if 'tol' in kwargs:
                tolerance = kwargs.get('tol')
            fit_result = iminuit.minimize(chisqfunc_uncorr, x0, tol=tolerance)  # Stopping criterion 0.002 * tol * errordef
            if kwargs.get('correlated_fit') is True:
                fit_result = iminuit.minimize(chisqfunc, fit_result.x, tol=tolerance)
            output.iterations = fit_result.nfev
        else:
            tolerance = 1e-12
            if 'tol' in kwargs:
                tolerance = kwargs.get('tol')
            fit_result = scipy.optimize.minimize(chisqfunc_uncorr, x0, method=kwargs.get('method'), tol=tolerance)
            if kwargs.get('correlated_fit') is True:
                fit_result = scipy.optimize.minimize(chisqfunc, fit_result.x, method=kwargs.get('method'), tol=tolerance)
            output.iterations = fit_result.nit

        chisquare = fit_result.fun

    else:
        if 'tol' in kwargs:
            print('tol cannot be set for Levenberg-Marquardt')

        def chisqfunc_residuals_uncorr(p):
            return general_chisqfunc_uncorr(p, y_f)

        fit_result = scipy.optimize.least_squares(chisqfunc_residuals_uncorr, x0, method='lm', ftol=1e-15, gtol=1e-15, xtol=1e-15)
        if kwargs.get('correlated_fit') is True:

            def chisqfunc_residuals(p):
                return general_chisqfunc(p, y_f)

            fit_result = scipy.optimize.least_squares(chisqfunc_residuals, fit_result.x, method='lm', ftol=1e-15, gtol=1e-15, xtol=1e-15)

        chisquare = np.sum(fit_result.fun ** 2)
        assert np.isclose(chisquare, chisqfunc(fit_result.x), atol=1e-14)

        output.iterations = fit_result.nfev

    if not fit_result.success:
        raise Exception('The minimization procedure did not converge.')

    # chisquare and dof are always recorded so that the steps below can rely on
    # them; the derived statistics are only defined for dof > 0.
    output.chisquare = chisquare
    output.dof = x_all.shape[-1] - n_parms
    if output.dof > 0:
        output.chisquare_by_dof = output.chisquare / output.dof
        output.p_value = 1 - scipy.stats.chi2.cdf(output.chisquare, output.dof)
    else:
        output.chisquare_by_dof = float('nan')

    output.message = fit_result.message
    if not silent:
        print(fit_result.message)
        print('chisquare/d.o.f.:', output.chisquare_by_dof)
        print('fit parameters', fit_result.x)

    def prepare_hat_matrix():
        # Jacobians of all fit functions with respect to the parameters,
        # flattened into one list of rows (one per data point).
        hat_vector = []
        for key in key_ls:
            x_array = np.asarray(xd[key])
            if (len(x_array) != 0):
                hat_vector.append(jacobian(funcd[key])(fit_result.x, x_array))
        hat_vector = [item for sublist in hat_vector for item in sublist]
        return hat_vector

    if kwargs.get('expected_chisquare') is True:
        if kwargs.get('correlated_fit') is not True:
            W = np.diag(1 / np.asarray(dy_f))
            cov = covariance(y_all)
            hat_vector = prepare_hat_matrix()
            A = W @ hat_vector
            P_phi = A @ np.linalg.pinv(A.T @ A) @ A.T
            expected_chisquare = np.trace((np.identity(x_all.shape[-1]) - P_phi) @ W @ cov @ W)
            output.chisquare_by_expected_chisquare = output.chisquare / expected_chisquare
            if not silent:
                print('chisquare/expected_chisquare:', output.chisquare_by_expected_chisquare)

    fitp = fit_result.x

    try:
        hess = hessian(chisqfunc)(fitp)
    except TypeError:
        raise Exception("It is required to use autograd.numpy instead of numpy within fit functions, see the documentation for details.") from None

    def chisqfunc_compact(d):
        # Same chisquare, but with the y values appended to the argument vector
        # so that mixed second derivatives can be taken.
        return anp.sum(general_chisqfunc(d[:n_parms], d[n_parms:]) ** 2)

    jac_jac_y = hessian(chisqfunc_compact)(np.concatenate((fitp, y_f)))

    # Compute hess^{-1} @ jac_jac_y[:n_parms, n_parms:] using LAPACK dgesv
    try:
        deriv_y = -scipy.linalg.solve(hess, jac_jac_y[:n_parms, n_parms:])
    except np.linalg.LinAlgError:
        raise Exception("Cannot invert hessian matrix.")

    # Build one Obs per fit parameter; the gradients are supplied manually via man_grad.
    result = []
    for i in range(n_parms):
        result.append(derived_observable(lambda x_all, **kwargs: (x_all[0] + np.finfo(np.float64).eps) / (y_all[0].value + np.finfo(np.float64).eps) * fitp[i], list(y_all), man_grad=list(deriv_y[i])))

    output.fit_parameters = result

    # Hotelling t-squared p-value for correlated fits (undefined for dof <= 0).
    if kwargs.get('correlated_fit') is True and output.dof > 0:
        n_cov = np.min(np.vectorize(lambda x_all: x_all.N)(y_all))
        output.t2_p_value = 1 - scipy.stats.f.cdf((n_cov - output.dof) / (output.dof * (n_cov - 1)) * output.chisquare,
                                                  output.dof, n_cov - output.dof)

    if kwargs.get('resplot') is True:
        for key in key_ls:
            residual_plot(xd[key], yd[key], funcd[key], result, title=key)

    if kwargs.get('qqplot') is True:
        for key in key_ls:
            qqplot(xd[key], yd[key], funcd[key], result, title=key)

    return output


def fit_lin(x, y, **kwargs):
    """Performs a linear fit to y = n + m * x and returns two Obs n, m.

    Parameters
    ----------
    x : list
        Can either be a list of floats in which case no xerror is assumed, or
        a list of Obs, where the dvalues of the Obs are used as xerror for the fit.
    y : list
        List of Obs, the dvalues of the Obs are used as yerror for the fit.

    Returns
    -------
    fit_parameters : list[Obs]
        List of fitted observables.
    """

    def linear_model(params, abscissa):
        return params[0] + params[1] * abscissa

    # Obs as x values carry their own errors and require a total least squares fit.
    if all(isinstance(entry, Obs) for entry in x):
        fit = total_least_squares(x, y, linear_model, **kwargs)
    elif all(isinstance(entry, (float, int)) for entry in x) or isinstance(x, np.ndarray):
        fit = least_squares(x, y, linear_model, **kwargs)
    else:
        raise Exception('Unsupported types for x')
    return fit.fit_parameters


def qqplot(x, o_y, func, p, title=""):
    """Draws a quantile-quantile plot of the normalized fit residuals, which can
       be used to check if the residuals of the fit are gaussian distributed.

    Returns
    -------
    None
    """

    # Residuals in units of the error of the data, in ascending order.
    normalized = sorted((obs - func(p, abscissa)) / obs.dvalue for abscissa, obs in zip(x, o_y))
    ordered_values = [res.value for res in normalized]

    quantile_fit = scipy.stats.probplot(ordered_values)
    theoretical = quantile_fit[0][0]
    regression = quantile_fit[1]

    plt.figure(figsize=(8, 8 / 1.618))
    plt.errorbar(theoretical, ordered_values, fmt='o')

    samples = np.arange(theoretical[0], theoretical[-1], 0.01)
    plt.plot(samples, samples, 'k--', zorder=11, label='Standard normal distribution')
    fit_label = 'Least squares fit, r=' + str(np.around(regression[2], 3))
    plt.plot(samples, regression[0] * samples + regression[1], zorder=10, label=fit_label, marker='', ls='-')

    plt.xlabel('Theoretical quantiles')
    plt.ylabel('Ordered Values')
    plt.legend(title=title)
    plt.draw()


def residual_plot(x, y, func, fit_res, title=""):
    """Draws the data together with the fit (upper panel) and the normalized residuals (lower panel).

    For uncorrelated data the residuals are expected to be distributed ~N(0,1).

    Returns
    -------
    None
    """
    # The plot range extends half a point spacing beyond the outermost x values.
    ordered = sorted(x)
    lower = ordered[0] - 0.5 * (ordered[1] - ordered[0])
    upper = ordered[-1] + 0.5 * (ordered[-1] - ordered[-2])
    grid = np.arange(lower, upper + 0.01, 0.01)

    y_values = [o.value for o in y]
    y_errors = [o.dvalue for o in y]
    parameters = [o.value for o in fit_res]

    plt.figure(figsize=(8, 8 / 1.618))
    layout = gridspec.GridSpec(2, 1, height_ratios=[3, 1], wspace=0.0, hspace=0.0)

    upper_panel = plt.subplot(layout[0])
    upper_panel.errorbar(x, y_values, yerr=y_errors, ls='none', fmt='o', capsize=3, markersize=5, label='Data')
    upper_panel.plot(grid, func(parameters, grid), label='Fit', zorder=10, ls='-', ms=0)
    upper_panel.set_xticklabels([])
    upper_panel.set_xlim([lower, upper])
    upper_panel.set_xticklabels([])
    upper_panel.legend(title=title)

    residuals = (np.asarray(y_values) - func(parameters, x)) / np.asarray(y_errors)

    lower_panel = plt.subplot(layout[1])
    lower_panel.plot(x, residuals, 'ko', ls='none', markersize=5)
    lower_panel.tick_params(direction='out')
    lower_panel.tick_params(axis="x", bottom=True, top=True, labelbottom=True)
    lower_panel.axhline(y=0.0, ls='--', color='k', marker=" ")
    # Shaded band marking residuals within one standard deviation.
    lower_panel.fill_between(grid, -1.0, 1.0, alpha=0.1, facecolor='k')
    lower_panel.set_xlim([lower, upper])
    lower_panel.set_ylabel('Residuals')
    plt.subplots_adjust(wspace=None, hspace=None)
    plt.draw()


def error_band(x, func, beta):
    """Calculate the error band for an array of sample values x, for given fit function func with optimized parameters beta.

    For every sample value the gradient of func with respect to the parameters
    is contracted with the covariance matrix of beta from both sides.

    Returns
    -------
    err : np.array
        Square root of the propagated variance, one entry per sample value in x
    """
    cov = covariance(beta)
    asymmetry = np.abs(cov - cov.T)
    if np.any(asymmetry > 1000 * np.finfo(np.float64).eps):
        warnings.warn("Covariance matrix is not symmetric within floating point precision", RuntimeWarning)

    central_values = [o.value for o in beta]
    parameter_gradient = egrad(func)
    gradients = [np.array(parameter_gradient(central_values, sample)) for sample in x]

    return np.array([np.sqrt(grad @ cov @ grad) for grad in gradients])


def ks_test(objects=None):
    """Performs a Kolmogorov–Smirnov test for the p-values of all fit objects.

    The sorted p-values are drawn as a step function against the diagonal,
    the largest absolute difference between the step heights and the sorted
    p-values is marked with an arrow, and the result of
    `scipy.stats.kstest(p_values, 'uniform')` is printed.

    Parameters
    ----------
    objects : list
        List of fit results to include in the analysis (optional).
        If None, all `Fit_result` instances known to the garbage collector
        which carry a `p_value` attribute are used.

    Returns
    -------
    None

    Raises
    ------
    ValueError
        If no p-values are available.
    """

    if objects is None:
        # Not every Fit_result carries a p_value (the constructor only sets
        # fit_parameters), so instances without one are skipped instead of
        # aborting the whole scan with an AttributeError.
        obs_list = [obj for obj in gc.get_objects()
                    if isinstance(obj, Fit_result) and hasattr(obj, 'p_value')]
    else:
        obs_list = objects

    p_values = [o.p_value for o in obs_list]

    bins = len(p_values)
    if bins == 0:
        # Fail before anything is drawn; otherwise np.argmax would raise a
        # less informative ValueError on an empty array further down.
        raise ValueError('No p-values available for the Kolmogorov-Smirnov test.')

    x = np.arange(0, 1.001, 0.001)
    plt.plot(x, x, 'k', zorder=1)
    plt.xlim(0, 1)
    plt.ylim(0, 1)
    plt.xlabel('p-value')
    plt.ylabel('Cumulative probability')
    plt.title(str(bins) + ' p-values')

    # Heights of the empirical cumulative distribution at the sorted p-values.
    n = np.arange(1, bins + 1) / np.float64(bins)
    Xs = np.sort(p_values)
    plt.step(Xs, n)
    diffs = n - Xs
    loc_max_diff = np.argmax(np.abs(diffs))
    loc = Xs[loc_max_diff]
    # Double-headed arrow from the diagonal to the step function at the largest deviation.
    plt.annotate('', xy=(loc, loc), xytext=(loc, loc + diffs[loc_max_diff]), arrowprops=dict(arrowstyle='<->', shrinkA=0, shrinkB=0))
    plt.draw()

    print(scipy.stats.kstest(p_values, 'uniform'))
-												feat: Automated Kolmogorov Smirnov test for fit p-values added

											
										
										
											2022-01-10 15:17:55 +01:00
+								import gc
-												Fit_result now inherits from sequence

											
										
										
											2021-11-01 14:21:39 +00:00
+								from collections.abc import Sequence
-												Warning messages promoted to RuntimeWarnings

											
										
										
											2021-10-15 12:11:06 +01:00
+								import warnings
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								import numpy as np
 								import autograd.numpy as anp
 								import scipy.optimize
 								import scipy.stats
 								import matplotlib.pyplot as plt
 								from matplotlib import gridspec
 								from scipy.odr import ODR, Model, RealData
 								import iminuit
-												feat: least_squares fit error propagation can now also be performed via
numerical derivatives.

											
										
										
											2022-10-05 17:44:38 +01:00
+								from autograd import jacobian as auto_jacobian
-												feat: double jacobian in standard fit replaced by hessian

This greatly improves performance for numerical derivatives and helps
with readability.

											
										
										
											2022-10-06 10:44:06 +01:00
+								from autograd import hessian as auto_hessian
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								from autograd import elementwise_grad as egrad
-												feat: least_squares fit error propagation can now also be performed via
numerical derivatives.

											
										
										
											2022-10-05 17:44:38 +01:00
+								from numdifftools import Jacobian as num_jacobian
-												feat: double jacobian in standard fit replaced by hessian

This greatly improves performance for numerical derivatives and helps
with readability.

											
										
										
											2022-10-06 10:44:06 +01:00
+								from numdifftools import Hessian as num_hessian
-												feat: priors in fits replaced by covobs, random hash added to avoid
prior collisions.

											
										
										
											2021-12-09 12:36:28 +00:00
+								from .obs import Obs, derived_observable, covariance, cov_Obs
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												Fit_result now inherits from sequence

											
										
										
											2021-11-01 14:21:39 +00:00
+								class Fit_result(Sequence):
-												docstrings extended

											
										
										
											2021-11-01 14:41:57 +00:00
+								    """Represents fit results.
 								    Attributes
 								    ----------
 								    fit_parameters : list
 								        results for the individual fit parameters,
-												docs: typos in docstrings corrected

											
										
										
											2021-11-15 11:13:12 +00:00
+								        also accessible via indices.
-												feat: Hotelling t-squared p-value for correlated fits added.

											
										
										
											2022-12-06 17:17:03 +00:00
+								    chisquare_by_dof : float
 								        reduced chisquare.
 								    p_value : float
 								        p-value of the fit
 								    t2_p_value : float
 								        Hotelling t-squared p-value for correlated fits.
-												docstrings extended

											
										
										
											2021-11-01 14:41:57 +00:00
+								    """
-												fit_result class added

											
										
										
											2021-10-31 11:06:12 +00:00
 								    def __init__(self):
 								        self.fit_parameters = None
-												Fit_result now inherits from sequence

											
										
										
											2021-11-01 14:21:39 +00:00
+								    def __getitem__(self, idx):
 								        return self.fit_parameters[idx]
 								    def __len__(self):
 								        return len(self.fit_parameters)
-												fix: Fit_result.gamma_method can now be called with kwargs

											
										
										
											2022-06-06 15:04:16 +01:00
+								    def gamma_method(self, **kwargs):
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								        """Apply the gamma method to all fit parameters"""
-												fix: Fit_result.gamma_method can now be called with kwargs

											
										
										
											2022-06-06 15:04:16 +01:00
+								        [o.gamma_method(**kwargs) for o in self.fit_parameters]
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
-												feat: gm alias for gamma_method also added to other classes.

											
										
										
											2023-01-13 17:26:52 +00:00
+								    gm = gamma_method
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								    def __str__(self):
-												Fit_result now inherits from sequence

											
										
										
											2021-11-01 14:21:39 +00:00
+								        my_str = 'Goodness of fit:\n'
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								        if hasattr(self, 'chisquare_by_dof'):
 								            my_str += '\u03C7\u00b2/d.o.f. = ' + f'{self.chisquare_by_dof:2.6f}' + '\n'
 								        elif hasattr(self, 'residual_variance'):
 								            my_str += 'residual variance = ' + f'{self.residual_variance:2.6f}' + '\n'
 								        if hasattr(self, 'chisquare_by_expected_chisquare'):
-												Fit_result now inherits from sequence

											
										
										
											2021-11-01 14:21:39 +00:00
+								            my_str += '\u03C7\u00b2/\u03C7\u00b2exp  = ' + f'{self.chisquare_by_expected_chisquare:2.6f}' + '\n'
-												feat: p-value calculation added to fit functions and fit result object

											
										
										
											2022-01-10 15:00:47 +01:00
+								        if hasattr(self, 'p_value'):
 								            my_str += 'p-value   = ' + f'{self.p_value:2.4f}' + '\n'
-												feat: Hotelling t-squared p-value for correlated fits added.

											
										
										
											2022-12-06 17:17:03 +00:00
+								        if hasattr(self, 't2_p_value'):
 								            my_str += 't\u00B2p-value = ' + f'{self.t2_p_value:2.4f}' + '\n'
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								        my_str += 'Fit parameters:\n'
 								        for i_par, par in enumerate(self.fit_parameters):
-												Fit_result now inherits from sequence

											
										
										
											2021-11-01 14:21:39 +00:00
+								            my_str += str(i_par) + '\t' + ' ' * int(par >= 0) + str(par).rjust(int(par < 0.0)) + '\n'
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								        return my_str
 								    def __repr__(self):
-												repr of fit result adjusted

											
										
										
											2021-11-01 15:03:39 +00:00
+								        m = max(map(len, list(self.__dict__.keys()))) + 1
 								        return '\n'.join([key.rjust(m) + ': ' + repr(value) for key, value in sorted(self.__dict__.items())])
-												fit_result class added

											
										
										
											2021-10-31 11:06:12 +00:00
-												least_squares function introduced

											
										
										
											2021-11-01 11:49:57 +00:00
+								def least_squares(x, y, func, priors=None, silent=False, **kwargs):
-												least_squares docstring updated

											
										
										
											2021-11-08 10:01:26 +00:00
+								    r'''Performs a non-linear fit to y = func(x).
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								        ```
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												docstrings updated

											
										
										
											2021-11-07 21:44:22 +00:00
+								    Parameters
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								    ----------
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    For an uncombined fit:
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								    x : list
 								        list of floats.
 								    y : list
 								        list of Obs.
 								    func : object
 								        fit function, has to be of the form
-												least_squares docstring updated

											
										
										
											2021-11-08 10:01:26 +00:00
+								        ```python
-												docs: documentation of error propagation for iterative algorithms
extended.

											
										
										
											2022-02-14 14:06:46 +00:00
+								        import autograd.numpy as anp
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								        def func(a, x):
-												docs: documentation of error propagation for iterative algorithms
extended.

											
										
										
											2022-02-14 14:06:46 +00:00
+								            return a[0] + a[1] * x + a[2] * anp.sinh(x)
-												least_squares docstring updated

											
										
										
											2021-11-08 10:01:26 +00:00
+								        ```
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
 								        For multiple x values func can be of the form
-												least_squares docstring updated

											
										
										
											2021-11-08 10:01:26 +00:00
+								        ```python
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								        def func(a, x):
 								            (x1, x2) = x
 								            return a[0] * x1 ** 2 + a[1] * x2
-												least_squares docstring updated

											
										
										
											2021-11-08 10:01:26 +00:00
+								        ```
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								        It is important that all numpy functions refer to autograd.numpy, otherwise the differentiation
-												docs: documentation of covariance and correlated fits extended.

											
										
										
											2022-03-05 08:13:24 +00:00
+								        will not work.
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    OR For a combined fit:
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												clean-up

											
										
										
											2022-12-16 18:55:43 +01:00
+								    x : dict
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								        dict of lists.
-												clean-up

											
										
										
											2022-12-16 18:55:43 +01:00
+								    y : dict
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								        dict of lists of Obs.
-												clean-up

											
										
										
											2022-12-16 18:55:43 +01:00
+								    funcs : dict
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								        dict of objects
 								        fit functions have to be of the form (here a[0] is the common fit parameter)
 								        ```python
 								        import autograd.numpy as anp
 								        funcs = {"a": func_a,
 								                "b": func_b}
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								        def func_a(a, x):
 								            return a[1] * anp.exp(-a[0] * x)
 								        def func_b(a, x):
 								            return a[2] * anp.exp(-a[0] * x)
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
 								        It is important that all numpy functions refer to autograd.numpy, otherwise the differentiation
-												docs: documentation of covariance and correlated fits extended.

											
										
										
											2022-03-05 08:13:24 +00:00
+								        will not work.
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								    priors : list, optional
 								        priors has to be a list with an entry for every parameter in the fit. The entries can either be
 								        Obs (e.g. results from a previous fit) or strings containing a value and an error formatted like
 .548(23), 500(40) or 0.5(0.4)
 								    silent : bool, optional
 								        If true all output to the console is omitted (default False).
-												docstrings updated

											
										
										
											2021-11-07 21:44:22 +00:00
+								    initial_guess : list
 								        can provide an initial guess for the input parameters. Relevant for
-												docs: Docstring for fits.least_square extended.

											
										
										
											2022-05-31 11:51:59 +01:00
+								        non-linear fits with many parameters. In case of correlated fits the guess is used to perform
 								        an uncorrelated fit which then serves as guess for the correlated fit.
-												refactor: Classification of fit method in fits.least_squares simplified,
precision of imiunit solver adjusted, prefitting for alternative methods
removed.

											
										
										
											2022-02-02 10:05:48 +00:00
+								    method : str, optional
-												docstrings updated

											
										
										
											2021-11-07 21:44:22 +00:00
+								        can be used to choose an alternative method for the minimization of chisquare.
 								        The possible methods are the ones which can be used for scipy.optimize.minimize and
 								        migrad of iminuit. If no method is specified, Levenberg-Marquard is used.
 								        Reliable alternatives are migrad, Powell and Nelder-Mead.
-												feat: added (default) method Levenberg-Marquardt, test added

											
										
										
											2022-12-20 15:26:13 +01:00
+								    tol: float, optional
-												fix/tests: Combined fit now also works when the keys of the x,y & func input dictionaries are not in the same order, build: improvements in performance

											
										
										
											2023-01-30 14:26:47 +01:00
+								        can be used (only for combined fits and methods other than Levenberg-Marquard) to set the tolerance for convergence
 								        to a different value to either speed up convergence at the cost of a larger error on the fitted parameters (and possibly
 								        invalid estimates for parameter uncertainties) or smaller values to get more accurate parameter values
 								        The stopping criterion depends on the method, e.g. migrad: edm_max = 0.002 * tol * errordef (EDM criterion: edm < edm_max)
-												docs: documentation of covariance and correlated fits extended.

											
										
										
											2022-03-05 08:13:24 +00:00
+								    correlated_fit : bool
 								        If True, use the full inverse covariance matrix in the definition of the chisquare cost function.
 								        For details about how the covariance matrix is estimated see `pyerrors.obs.covariance`.
 								        In practice the correlation matrix is Cholesky decomposed and inverted (instead of the covariance matrix).
 								        This procedure should be numerically more stable as the correlation matrix is typically better conditioned (Jacobi preconditioning).
 								        At the moment this option only works for `prior==None` and when no `method` is given.
 								    expected_chisquare : bool
 								        If True estimates the expected chisquare which is
 								        corrected by effects caused by correlated input data (default False).
-												docstrings updated

											
										
										
											2021-11-07 21:44:22 +00:00
+								    resplot : bool
-												docs: documentation of covariance and correlated fits extended.

											
										
										
											2022-03-05 08:13:24 +00:00
+								        If True, a plot which displays fit, data and residuals is generated (default False).
-												docstrings updated

											
										
										
											2021-11-07 21:44:22 +00:00
+								    qqplot : bool
-												docs: documentation of covariance and correlated fits extended.

											
										
										
											2022-03-05 08:13:24 +00:00
+								        If True, a quantile-quantile plot of the fit result is generated (default False).
-												feat: least_squares fit error propagation can now also be performed via
numerical derivatives.

											
										
										
											2022-10-05 17:44:38 +01:00
+								    num_grad : bool
 								        Use numerical differentation instead of automatic differentiation to perform the error propagation (default False).
-												better docstrings (#144)

* first example of returns statement in docstring

* added a some return statements for pandas API

* last return statements in pandas input

* added returns to bdio docstrings

* few returns statements added to docstring

* finished docstrings for hadrons submodule

* also finished docstrings for json submodule

* finished misc submodule

* added returns in docstrings in openqQCD

* made some cosmetic chanes to dostrings

* added return nad return statement in docstring

* linting

* Improved docstrings of mpm, fits, roots, misc to have return statements

returns added for misc.py

returns added for mpm.py

reutrns added for fits.py

* linting...

* Some polishing of docstrings
											
										
										
											2023-01-16 15:57:22 +01:00
 								    Returns
 								    -------
 								    output : Fit_result
 								        Parameters and information on the fitted result.
-												least_squares docstring updated

											
										
										
											2021-11-08 10:01:26 +00:00
+								    '''
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								    if priors is not None:
 								        return _prior_fit(x, y, func, priors, silent=silent, **kwargs)
 								    else:
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								        return _combined_fit(x, y, func, silent=silent, **kwargs)
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
-												odr_fit renamed, deprecation warning added

least_squares and total_least_squares are now available to the top level
namespace

											
										
										
											2021-11-01 12:01:46 +00:00
+								def total_least_squares(x, y, func, silent=False, **kwargs):
-												total_least_squares docstring updated

											
										
										
											2021-11-08 09:50:51 +00:00
+								    r'''Performs a non-linear fit to y = func(x) and returns a list of Obs corresponding to the fit parameters.
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												docstrings updated

											
										
										
											2021-11-07 21:44:22 +00:00
+								    Parameters
 								    ----------
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								    x : list
 								        list of Obs, or a tuple of lists of Obs
 								    y : list
 								        list of Obs. The dvalues of the Obs are used as x- and yerror for the fit.
 								    func : object
 								        func has to be of the form
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												total_least_squares docstring updated

											
										
										
											2021-11-08 09:50:51 +00:00
+								        ```python
-												docs: documentation of error propagation for iterative algorithms
extended.

											
										
										
											2022-02-14 14:06:46 +00:00
+								        import autograd.numpy as anp
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								        def func(a, x):
-												docs: documentation of error propagation for iterative algorithms
extended.

											
										
										
											2022-02-14 14:06:46 +00:00
+								            return a[0] + a[1] * x + a[2] * anp.sinh(x)
-												total_least_squares docstring updated

											
										
										
											2021-11-08 09:50:51 +00:00
+								        ```
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								        For multiple x values func can be of the form
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												total_least_squares docstring updated

											
										
										
											2021-11-08 09:50:51 +00:00
+								        ```python
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								        def func(a, x):
 								            (x1, x2) = x
 								            return a[0] * x1 ** 2 + a[1] * x2
-												total_least_squares docstring updated

											
										
										
											2021-11-08 09:50:51 +00:00
+								        ```
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
+								        It is important that all numpy functions refer to autograd.numpy, otherwise the differentiation
 								        will not work.
 								    silent : bool, optional
 								        If true all output to the console is omitted (default False).
-												docstrings updated

											
										
										
											2021-11-07 21:44:22 +00:00
+								    initial_guess : list
 								        can provide an initial guess for the input parameters. Relevant for non-linear
 								        fits with many parameters.
 								    expected_chisquare : bool
 								        If true prints the expected chisquare which is
 								        corrected by effects caused by correlated input data.
 								        This can take a while as the full correlation matrix
 								        has to be calculated (default False).
-												feat: hessian added to prior fit and odr fit routines.

											
										
										
											2022-10-06 18:07:19 +01:00
+								    num_grad : bool
 								        Use numerical differentation instead of automatic differentiation to perform the error propagation (default False).
-												total_least_squares docstring updated

											
										
										
											2021-11-08 09:50:51 +00:00
-												docs: formatting of docstrings improved.

											
										
										
											2022-03-05 08:43:57 +00:00
+								    Notes
 								    -----
-												better docstrings (#144)

* first example of returns statement in docstring

* added a some return statements for pandas API

* last return statements in pandas input

* added returns to bdio docstrings

* few returns statements added to docstring

* finished docstrings for hadrons submodule

* also finished docstrings for json submodule

* finished misc submodule

* added returns in docstrings in openqQCD

* made some cosmetic chanes to dostrings

* added return nad return statement in docstring

* linting

* Improved docstrings of mpm, fits, roots, misc to have return statements

returns added for misc.py

returns added for mpm.py

reutrns added for fits.py

* linting...

* Some polishing of docstrings
											
										
										
											2023-01-16 15:57:22 +01:00
+								    Based on the orthogonal distance regression module of scipy.
 								    Returns
 								    -------
 								    output : Fit_result
 								        Parameters and information on the fitted result.
-												total_least_squares docstring updated

											
										
										
											2021-11-08 09:50:51 +00:00
+								    '''
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												fit_result class added

											
										
										
											2021-10-31 11:06:12 +00:00
+								    output = Fit_result()
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												fit_result class added

											
										
										
											2021-10-31 11:06:12 +00:00
+								    output.fit_function = func
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								    x = np.array(x)
 								    x_shape = x.shape
-												feat: hessian added to prior fit and odr fit routines.

											
										
										
											2022-10-06 18:07:19 +01:00
+								    if kwargs.get('num_grad') is True:
 								        jacobian = num_jacobian
 								        hessian = num_hessian
 								    else:
 								        jacobian = auto_jacobian
 								        hessian = auto_hessian
-												feat: least_squares fit error propagation can now also be performed via
numerical derivatives.

											
										
										
											2022-10-05 17:44:38 +01:00
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								    if not callable(func):
 								        raise TypeError('func has to be a function.')
-												fix: detection of invalid fit functions extended.

											
										
										
											2022-06-24 12:50:26 +01:00
+								    for i in range(42):
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								        try:
 								            func(np.arange(i), x.T[0])
-												refactor: Unused variable in fit function detection removed.

											
										
										
											2022-06-24 13:12:53 +01:00
+								        except TypeError:
 								            continue
 								        except IndexError:
-												fix: detection of invalid fit functions extended.

											
										
										
											2022-06-24 12:50:26 +01:00
+								            continue
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								        else:
 								            break
-												fix: detection of invalid fit functions extended.

											
										
										
											2022-06-24 12:50:26 +01:00
+								    else:
 								        raise RuntimeError("Fit function is not valid.")
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								    n_parms = i
 								    if not silent:
-												feat: stdout of fit routines improved

											
										
										
											2022-01-24 13:22:35 +00:00
+								        print('Fit with', n_parms, 'parameter' + 's' * (n_parms > 1))
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								    x_f = np.vectorize(lambda o: o.value)(x)
 								    dx_f = np.vectorize(lambda o: o.dvalue)(x)
 								    y_f = np.array([o.value for o in y])
 								    dy_f = np.array([o.dvalue for o in y])
 								    if np.any(np.asarray(dx_f) <= 0.0):
 								        raise Exception('No x errors available, run the gamma method first.')
 								    if np.any(np.asarray(dy_f) <= 0.0):
 								        raise Exception('No y errors available, run the gamma method first.')
 								    if 'initial_guess' in kwargs:
 								        x0 = kwargs.get('initial_guess')
 								        if len(x0) != n_parms:
-												Added the possibility to use constrained fit parameters. Added correlated least squares.

											
										
										
											2021-11-15 16:39:50 +01:00
+								            raise Exception('Initial guess does not have the correct length: %d vs. %d' % (len(x0), n_parms))
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								    else:
 								        x0 = [1] * n_parms
 								    data = RealData(x_f, y_f, sx=dx_f, sy=dy_f)
 								    model = Model(func)
-												further instances of np.float removed

											
										
										
											2021-10-12 14:12:21 +01:00
+								    odr = ODR(data, model, x0, partol=np.finfo(np.float64).eps)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								    odr.set_job(fit_type=0, deriv=1)
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								    out = odr.run()
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								    output.residual_variance = out.res_var
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												fit_result class added

											
										
										
											2021-10-31 11:06:12 +00:00
+								    output.method = 'ODR'
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												least_squares function introduced

											
										
										
											2021-11-01 11:49:57 +00:00
+								    output.message = out.stopreason
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								    output.xplus = out.xplus
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								    if not silent:
 								        print('Method: ODR')
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								        print(*out.stopreason)
-												fit_result class added

											
										
										
											2021-10-31 11:06:12 +00:00
+								        print('Residual variance:', output.residual_variance)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								    if out.info > 3:
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								        raise Exception('The minimization procedure did not converge.')
 								    m = x_f.size
 								    def odr_chisquare(p):
 								        model = func(p[:n_parms], p[n_parms:].reshape(x_shape))
 								        chisq = anp.sum(((y_f - model) / dy_f) ** 2) + anp.sum(((x_f - p[n_parms:].reshape(x_shape)) / dx_f) ** 2)
 								        return chisq
 								    if kwargs.get('expected_chisquare') is True:
 								        W = np.diag(1 / np.asarray(np.concatenate((dy_f.ravel(), dx_f.ravel()))))
 								        if kwargs.get('covariance') is not None:
 								            cov = kwargs.get('covariance')
 								        else:
-												feat: positive semi-definite estimator for the covariance implemented,
fits.covariance matrix deprecated, covariance can now handle lists of
observables.

											
										
										
											2022-03-01 09:45:25 +00:00
+								            cov = covariance(np.concatenate((y, x.ravel())))
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								        number_of_x_parameters = int(m / x_f.shape[-1])
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								        old_jac = jacobian(func)(out.beta, out.xplus)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								        fused_row1 = np.concatenate((old_jac, np.concatenate((number_of_x_parameters * [np.zeros(old_jac.shape)]), axis=0)))
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								        fused_row2 = np.concatenate((jacobian(lambda x, y: func(y, x))(out.xplus, out.beta).reshape(x_f.shape[-1], x_f.shape[-1] * number_of_x_parameters), np.identity(number_of_x_parameters * old_jac.shape[0])))
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								        new_jac = np.concatenate((fused_row1, fused_row2), axis=1)
 								        A = W @ new_jac
-												fix: replaced inverse by the pseudo inverse in the calculation of
chi_exp

											
										
										
											2022-03-03 18:29:18 +00:00
+								        P_phi = A @ np.linalg.pinv(A.T @ A) @ A.T
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								        expected_chisquare = np.trace((np.identity(P_phi.shape[0]) - P_phi) @ W @ cov @ W)
 								        if expected_chisquare <= 0.0:
-												Warning messages promoted to RuntimeWarnings

											
										
										
											2021-10-15 12:11:06 +01:00
+								            warnings.warn("Negative expected_chisquare.", RuntimeWarning)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								            expected_chisquare = np.abs(expected_chisquare)
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								        output.chisquare_by_expected_chisquare = odr_chisquare(np.concatenate((out.beta, out.xplus.ravel()))) / expected_chisquare
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								        if not silent:
 								            print('chisquare/expected_chisquare:',
-												fit_result class added

											
										
										
											2021-10-31 11:06:12 +00:00
+								                  output.chisquare_by_expected_chisquare)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												refactor!: const_par keyword for constrained fits removed from functions
in fit module.

											
										
										
											2022-01-24 17:43:23 +00:00
+								    fitp = out.beta
-												fix: no-autograd exception in fits works again.

											
										
										
											2022-05-25 14:51:46 +01:00
+								    try:
-												feat: hessian added to prior fit and odr fit routines.

											
										
										
											2022-10-06 18:07:19 +01:00
+								        hess = hessian(odr_chisquare)(np.concatenate((fitp, out.xplus.ravel())))
-												fix: no-autograd exception in fits works again.

											
										
										
											2022-05-25 14:51:46 +01:00
+								    except TypeError:
 								        raise Exception("It is required to use autograd.numpy instead of numpy within fit functions, see the documentation for details.") from None
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								    def odr_chisquare_compact_x(d):
-												refactor!: const_par keyword for constrained fits removed from functions
in fit module.

											
										
										
											2022-01-24 17:43:23 +00:00
+								        model = func(d[:n_parms], d[n_parms:n_parms + m].reshape(x_shape))
 								        chisq = anp.sum(((y_f - model) / dy_f) ** 2) + anp.sum(((d[n_parms + m:].reshape(x_shape) - d[n_parms:n_parms + m].reshape(x_shape)) / dx_f) ** 2)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								        return chisq
-												feat: hessian added to prior fit and odr fit routines.

											
										
										
											2022-10-06 18:07:19 +01:00
+								    jac_jac_x = hessian(odr_chisquare_compact_x)(np.concatenate((fitp, out.xplus.ravel(), x_f.ravel())))
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												feat: optimized calculation of the inverse hessian for error propagation
in fits.

											
										
										
											2022-05-26 10:19:39 +01:00
+								    # Compute hess^{-1} @ jac_jac_x[:n_parms + m, n_parms + m:] using LAPACK dgesv
 								    try:
 								        deriv_x = -scipy.linalg.solve(hess, jac_jac_x[:n_parms + m, n_parms + m:])
 								    except np.linalg.LinAlgError:
 								        raise Exception("Cannot invert hessian matrix.")
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								    def odr_chisquare_compact_y(d):
-												refactor!: const_par keyword for constrained fits removed from functions
in fit module.

											
										
										
											2022-01-24 17:43:23 +00:00
+								        model = func(d[:n_parms], d[n_parms:n_parms + m].reshape(x_shape))
 								        chisq = anp.sum(((d[n_parms + m:] - model) / dy_f) ** 2) + anp.sum(((x_f - d[n_parms:n_parms + m].reshape(x_shape)) / dx_f) ** 2)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								        return chisq
-												feat: hessian added to prior fit and odr fit routines.

											
										
										
											2022-10-06 18:07:19 +01:00
+								    jac_jac_y = hessian(odr_chisquare_compact_y)(np.concatenate((fitp, out.xplus.ravel(), y_f)))
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												feat: optimized calculation of the inverse hessian for error propagation
in fits.

											
										
										
											2022-05-26 10:19:39 +01:00
+								    # Compute hess^{-1} @ jac_jac_y[:n_parms + m, n_parms + m:] using LAPACK dgesv
 								    try:
 								        deriv_y = -scipy.linalg.solve(hess, jac_jac_y[:n_parms + m, n_parms + m:])
 								    except np.linalg.LinAlgError:
 								        raise Exception("Cannot invert hessian matrix.")
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								    result = []
 								    for i in range(n_parms):
-												fix: fits and root now work when the value of the zeroth input is
exactly zero. Tests extended.

											
										
										
											2021-12-07 18:40:36 +00:00
+								        result.append(derived_observable(lambda my_var, **kwargs: (my_var[0] + np.finfo(np.float64).eps) / (x.ravel()[0].value + np.finfo(np.float64).eps) * out.beta[i], list(x.ravel()) + list(y), man_grad=list(deriv_x[i]) + list(deriv_y[i])))
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												refactor!: const_par keyword for constrained fits removed from functions
in fit module.

											
										
										
											2022-01-24 17:43:23 +00:00
+								    output.fit_parameters = result
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												Fit_result gammma_method, str and repr added

											
										
										
											2021-10-31 12:00:26 +00:00
+								    output.odr_chisquare = odr_chisquare(np.concatenate((out.beta, out.xplus.ravel())))
-												fit_result class added

											
										
										
											2021-10-31 11:06:12 +00:00
+								    output.dof = x.shape[-1] - n_parms
-												refactor: imports of scipy.stats in fits simplified.

											
										
										
											2022-06-15 14:14:01 +01:00
+								    output.p_value = 1 - scipy.stats.chi2.cdf(output.odr_chisquare, output.dof)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												fit_result class added

											
										
										
											2021-10-31 11:06:12 +00:00
+								    return output
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												documentation of fit functions adjusted, deprecation warnings added to
standard_fit and prior_fit

											
										
										
											2021-11-01 14:54:36 +00:00
def _prior_fit(x, y, func, priors, silent=False, **kwargs):
    """Least-squares fit with Gaussian priors on every fit parameter.

    The function minimised is the sum of the uncorrelated data term
    ``sum(((y - func(p, x)) / dy) ** 2)`` and the prior term
    ``sum(((prior - p) / dprior) ** 2)``; the minimisation is done with
    iminuit's migrad.

    Parameters
    ----------
    x : array_like
        x values; converted with ``np.asarray`` and handed to ``func``.
    y : list
        Data points; every entry must expose ``value`` and ``dvalue``
        (``dvalue`` has to be strictly positive).
    func : callable
        Fit function, called as ``func(p, x)`` with the parameter vector
        ``p``. The number of parameters is detected automatically.
    priors : list
        One prior per fit parameter. Entries are either ``Obs`` instances
        or strings of the form ``"value(error)"``, e.g. ``"0.548(23)"``
        which is read as 0.548 +/- 0.023.
    silent : bool
        If True, nothing is printed to stdout.
    **kwargs
        num_grad : bool
            If True use numerical (numdifftools) instead of autograd
            hessians.
        initial_guess : sequence
            Start values for the minimiser (defaults to the prior values).
        tol : float
            Tolerance passed to the minimiser (default 1e-4).
        resplot : bool
            If True call ``residual_plot`` on the result.
        qqplot : bool
            If True call ``qqplot`` on the result.

    Returns
    -------
    Fit_result
        With the attributes ``fit_function``, ``priors``,
        ``chisquare_by_dof``, ``method``, ``fit_parameters`` and
        ``chisquare`` set.

    Raises
    ------
    TypeError
        If ``func`` is not callable.
    RuntimeError
        If no parameter count below 100 makes ``func`` callable.
    Exception
        On length mismatches of priors / initial guess, on missing errors
        of data or priors, or if the minimisation did not converge.
    """
    output = Fit_result()
    output.fit_function = func

    x = np.asarray(x)

    # Select the differentiation backend for the second derivatives.
    hessian = num_hessian if kwargs.get('num_grad') is True else auto_hessian

    if not callable(func):
        raise TypeError('func has to be a function.')

    # Probe func with growing parameter vectors; the first length that does
    # not trigger a TypeError/IndexError is taken as the parameter count.
    for n_parms in range(100):
        try:
            func(np.arange(n_parms), 0)
        except (TypeError, IndexError):
            continue
        break
    else:
        raise RuntimeError("Fit function is not valid.")

    if n_parms != len(priors):
        raise Exception('Priors does not have the correct length.')

    def extract_val_and_dval(string):
        # Parse "value(error)". If only the value carries a decimal point,
        # the error is given in units of the last digits of the value.
        parts = string.split('(')
        head = parts[0]
        tail = parts[1][:-1]
        factor = 10 ** -len(head.partition('.')[2]) if ('.' in head and '.' not in tail) else 1
        return float(head), float(tail) * factor

    # Obs priors are used as they are; string priors are turned into
    # cov_Obs objects whose name carries a random suffix.
    loc_priors = []
    for prior_idx, prior in enumerate(priors):
        if isinstance(prior, Obs):
            loc_priors.append(prior)
            continue
        prior_val, prior_err = extract_val_and_dval(prior)
        prior_name = '#prior' + str(prior_idx) + f"_{np.random.randint(2147483647):010d}"
        loc_priors.append(cov_Obs(prior_val, prior_err ** 2, prior_name))

    output.priors = loc_priors

    if not silent:
        print('Fit with', n_parms, 'parameter' + 's' * (n_parms > 1))

    y_f = [obs.value for obs in y]
    dy_f = [obs.dvalue for obs in y]
    if np.any(np.asarray(dy_f) <= 0.0):
        raise Exception('No y errors available, run the gamma method first.')

    p_f = [obs.value for obs in loc_priors]
    dp_f = [obs.dvalue for obs in loc_priors]
    if np.any(np.asarray(dp_f) <= 0.0):
        raise Exception('No prior errors available, run the gamma method first.')

    if 'initial_guess' in kwargs:
        x0 = kwargs.get('initial_guess')
        if len(x0) != n_parms:
            raise Exception('Initial guess does not have the correct length.')
    else:
        # Without an explicit guess the fit starts at the prior values.
        x0 = p_f

    def chisqfunc(p):
        # Data term plus prior term.
        data_term = anp.sum(((y_f - func(p, x)) / dy_f) ** 2)
        prior_term = anp.sum(((p_f - p) / dp_f) ** 2)
        return data_term + prior_term

    if not silent:
        print('Method: migrad')

    minimizer = iminuit.Minuit(chisqfunc, x0)
    minimizer.errordef = 1
    minimizer.print_level = 0
    minimizer.tol = kwargs.get('tol') if 'tol' in kwargs else 1e-4
    minimizer.migrad()
    params = np.asarray(minimizer.values)

    n_data = len(x)
    output.chisquare_by_dof = minimizer.fval / n_data
    output.method = 'migrad'

    if not silent:
        print('chisquare/d.o.f.:', output.chisquare_by_dof)

    if not minimizer.fmin.is_valid:
        raise Exception('The minimization procedure did not converge.')

    hess_inv = np.linalg.pinv(hessian(chisqfunc)(params))

    def chisqfunc_compact(d):
        # Same chi^2, but as a function of the concatenated vector
        # (parameters, data values, prior values).
        fit_p = d[:n_parms]
        data_vals = d[n_parms: n_parms + n_data]
        prior_vals = d[n_parms + n_data:]
        data_term = anp.sum(((data_vals - func(fit_p, x)) / dy_f) ** 2)
        prior_term = anp.sum(((prior_vals - fit_p) / dp_f) ** 2)
        return data_term + prior_term

    jac_jac = hessian(chisqfunc_compact)(np.concatenate((params, y_f, p_f)))

    # Mixed (parameter, input) block of the second derivatives, contracted
    # with the pseudo-inverse hessian, is used as the manual gradient of each
    # fit parameter with respect to the data and prior values.
    deriv = -hess_inv @ jac_jac[:n_parms, n_parms:]

    eps = np.finfo(np.float64).eps
    inputs = list(y) + list(loc_priors)
    # The ratio in front of params[idx] evaluates to 1 up to rounding, so the
    # resulting observable has the value params[idx]; eps keeps the expression
    # finite when y[0].value is exactly zero.
    result = [
        derived_observable(lambda vals, **kwargs: (vals[0] + eps) / (y[0].value + eps) * params[idx],
                           inputs, man_grad=list(deriv[idx]))
        for idx in range(n_parms)
    ]

    output.fit_parameters = result
    output.chisquare = chisqfunc(np.asarray(params))

    if kwargs.get('resplot') is True:
        residual_plot(x, y, func, result)

    if kwargs.get('qqplot') is True:
        qqplot(x, y, func, result)

    return output
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
+								def _combined_fit(x, y, func, silent=False, **kwargs):
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    output = Fit_result()
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
 								    if (type(x) == dict and type(y) == dict and type(func) == dict):
 								        xd = x
 								        yd = y
 								        funcd = func
 								        output.fit_function = func
 								    elif (type(x) == dict or type(y) == dict or type(func) == dict):
 								        raise TypeError("All arguments have to be dictionaries in order to perform a combined fit.")
 								    else:
 								        x = np.asarray(x)
 								        xd = {"": x}
 								        yd = {"": y}
 								        funcd = {"": func}
 								        output.fit_function = func
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    if kwargs.get('num_grad') is True:
 								        jacobian = num_jacobian
 								        hessian = num_hessian
 								    else:
 								        jacobian = auto_jacobian
 								        hessian = auto_hessian
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								    key_ls = sorted(list(xd.keys()))
-												fix/tests: Combined fit now also works when the keys of the x,y & func input dictionaries are not in the same order, build: improvements in performance

											
										
										
											2023-01-30 14:26:47 +01:00
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								    if sorted(list(yd.keys())) != key_ls:
-												fix/tests: Combined fit now also works when the keys of the x,y & func input dictionaries are not in the same order, build: improvements in performance

											
										
										
											2023-01-30 14:26:47 +01:00
+								        raise Exception('x and y dictionaries do not contain the same keys.')
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								    if sorted(list(funcd.keys())) != key_ls:
-												fix/tests: Combined fit now also works when the keys of the x,y & func input dictionaries are not in the same order, build: improvements in performance

											
										
										
											2023-01-30 14:26:47 +01:00
+								        raise Exception('x and func dictionaries do not contain the same keys.')
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								    x_all = np.concatenate([np.array(xd[key]) for key in key_ls])
 								    y_all = np.concatenate([np.array(yd[key]) for key in key_ls])
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												feat: added (default) method Levenberg-Marquardt, test added

											
										
										
											2022-12-20 15:26:13 +01:00
+								    y_f = [o.value for o in y_all]
 								    dy_f = [o.dvalue for o in y_all]
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    if len(x_all.shape) > 2:
 								        raise Exception('Unknown format for x values')
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								    if np.any(np.asarray(dy_f) <= 0.0):
 								        raise Exception('No y errors available, run the gamma method first.')
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    # number of fit parameters
 								    n_parms_ls = []
-												fix/tests: Combined fit now also works when the keys of the x,y & func input dictionaries are not in the same order, build: improvements in performance

											
										
										
											2023-01-30 14:26:47 +01:00
+								    for key in key_ls:
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								        if not callable(funcd[key]):
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
+								            raise TypeError('func (key=' + key + ') is not a function.')
-												fix: multi dim fits fixed in least squares. Test added. (#160)

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>
											
										
										
											2023-03-03 16:35:26 +00:00
+								        if np.asarray(xd[key]).shape[-1] != len(yd[key]):
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
+								            raise Exception('x and y input (key=' + key + ') do not have the same length')
-												fix/tests: Combined fit now also works when the keys of the x,y & func input dictionaries are not in the same order, build: improvements in performance

											
										
										
											2023-01-30 14:26:47 +01:00
+								        for i in range(100):
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								            try:
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								                funcd[key](np.arange(i), x_all.T[0])
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								            except TypeError:
 								                continue
 								            except IndexError:
 								                continue
 								            else:
 								                break
 								        else:
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
+								            raise RuntimeError("Fit function (key=" + key + ") is not valid.")
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								        n_parms = i
 								        n_parms_ls.append(n_parms)
 								    n_parms = max(n_parms_ls)
 								    if not silent:
 								        print('Fit with', n_parms, 'parameter' + 's' * (n_parms > 1))
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    if 'initial_guess' in kwargs:
 								        x0 = kwargs.get('initial_guess')
 								        if len(x0) != n_parms:
 								            raise Exception('Initial guess does not have the correct length: %d vs. %d' % (len(x0), n_parms))
 								    else:
 								        x0 = [0.1] * n_parms
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								    def general_chisqfunc_uncorr(p, ivars):
 								        model = anp.concatenate([anp.array(funcd[key](p, anp.asarray(xd[key]))).reshape(-1) for key in key_ls])
 								        return ((ivars - model) / dy_f)
 								    def chisqfunc_uncorr(p):
 								        return anp.sum(general_chisqfunc_uncorr(p, y_f) ** 2)
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								    if kwargs.get('correlated_fit') is True:
 								        corr = covariance(y_all, correlation=True, **kwargs)
 								        covdiag = np.diag(1 / np.asarray(dy_f))
 								        condn = np.linalg.cond(corr)
 								        if condn > 0.1 / np.finfo(float).eps:
 								            raise Exception(f"Cannot invert correlation matrix as its condition number exceeds machine precision ({condn:1.2e})")
 								        if condn > 1e13:
 								            warnings.warn("Correlation matrix may be ill-conditioned, condition number: {%1.2e}" % (condn), RuntimeWarning)
 								        chol = np.linalg.cholesky(corr)
 								        chol_inv = scipy.linalg.solve_triangular(chol, covdiag, lower=True)
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								        def general_chisqfunc(p, ivars):
-												refactor: removed redundant formulations of the chisquare function in
least_squares.

											
										
										
											2023-03-01 16:26:37 +00:00
+								            model = anp.concatenate([anp.array(funcd[key](p, anp.asarray(xd[key]))).reshape(-1) for key in key_ls])
 								            return anp.dot(chol_inv, (ivars - model))
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								        def chisqfunc(p):
 								            return anp.sum(general_chisqfunc(p, y_f) ** 2)
 								    else:
 								        general_chisqfunc = general_chisqfunc_uncorr
 								        chisqfunc = chisqfunc_uncorr
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												feat: added (default) method Levenberg-Marquardt, test added

											
										
										
											2022-12-20 15:26:13 +01:00
+								    output.method = kwargs.get('method', 'Levenberg-Marquardt')
 								    if not silent:
 								        print('Method:', output.method)
 								    if output.method != 'Levenberg-Marquardt':
 								        if output.method == 'migrad':
-												fix: reduced the migrad solver tolerance + removed unnecessary check

											
										
										
											2023-01-30 15:16:41 +01:00
+								            tolerance = 1e-4  # default value of 1e-1 set by iminuit can be problematic
-												feat: added (default) method Levenberg-Marquardt, test added

											
										
										
											2022-12-20 15:26:13 +01:00
+								            if 'tol' in kwargs:
 								                tolerance = kwargs.get('tol')
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								            fit_result = iminuit.minimize(chisqfunc_uncorr, x0, tol=tolerance)  # Stopping criterion 0.002 * tol * errordef
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								            if kwargs.get('correlated_fit') is True:
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								                fit_result = iminuit.minimize(chisqfunc, fit_result.x, tol=tolerance)
-												feat: added (default) method Levenberg-Marquardt, test added

											
										
										
											2022-12-20 15:26:13 +01:00
+								            output.iterations = fit_result.nfev
 								        else:
 								            tolerance = 1e-12
 								            if 'tol' in kwargs:
 								                tolerance = kwargs.get('tol')
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								            fit_result = scipy.optimize.minimize(chisqfunc_uncorr, x0, method=kwargs.get('method'), tol=tolerance)
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								            if kwargs.get('correlated_fit') is True:
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								                fit_result = scipy.optimize.minimize(chisqfunc, fit_result.x, method=kwargs.get('method'), tol=tolerance)
-												feat: added (default) method Levenberg-Marquardt, test added

											
										
										
											2022-12-20 15:26:13 +01:00
+								            output.iterations = fit_result.nit
 								        chisquare = fit_result.fun
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    else:
 								        if 'tol' in kwargs:
-												feat: added (default) method Levenberg-Marquardt, test added

											
										
										
											2022-12-20 15:26:13 +01:00
+								            print('tol cannot be set for Levenberg-Marquardt')
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								        def chisqfunc_residuals_uncorr(p):
 								            return general_chisqfunc_uncorr(p, y_f)
 								        fit_result = scipy.optimize.least_squares(chisqfunc_residuals_uncorr, x0, method='lm', ftol=1e-15, gtol=1e-15, xtol=1e-15)
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								        if kwargs.get('correlated_fit') is True:
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
 								            def chisqfunc_residuals(p):
 								                return general_chisqfunc(p, y_f)
 								            fit_result = scipy.optimize.least_squares(chisqfunc_residuals, fit_result.x, method='lm', ftol=1e-15, gtol=1e-15, xtol=1e-15)
-												feat: added (default) method Levenberg-Marquardt, test added

											
										
										
											2022-12-20 15:26:13 +01:00
 								        chisquare = np.sum(fit_result.fun ** 2)
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								        assert np.isclose(chisquare, chisqfunc(fit_result.x), atol=1e-14)
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								        output.iterations = fit_result.nfev
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    if not fit_result.success:
 								        raise Exception('The minimization procedure did not converge.')
 								    if x_all.shape[-1] - n_parms > 0:
-												feat: added (default) method Levenberg-Marquardt, test added

											
										
										
											2022-12-20 15:26:13 +01:00
+								        output.chisquare = chisquare
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								        output.dof = x_all.shape[-1] - n_parms
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
+								        output.chisquare_by_dof = output.chisquare / output.dof
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								        output.p_value = 1 - scipy.stats.chi2.cdf(output.chisquare, output.dof)
 								    else:
 								        output.chisquare_by_dof = float('nan')
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								    output.message = fit_result.message
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    if not silent:
 								        print(fit_result.message)
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
+								        print('chisquare/d.o.f.:', output.chisquare_by_dof)
 								        print('fit parameters', fit_result.x)
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    def prepare_hat_matrix():
 								        hat_vector = []
-												fix/tests: Combined fit now also works when the keys of the x,y & func input dictionaries are not in the same order, build: improvements in performance

											
										
										
											2023-01-30 14:26:47 +01:00
+								        for key in key_ls:
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								            x_array = np.asarray(xd[key])
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
+								            if (len(x_array) != 0):
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								                hat_vector.append(jacobian(funcd[key])(fit_result.x, x_array))
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								        hat_vector = [item for sublist in hat_vector for item in sublist]
 								        return hat_vector
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								    if kwargs.get('expected_chisquare') is True:
 								        if kwargs.get('correlated_fit') is not True:
 								            W = np.diag(1 / np.asarray(dy_f))
 								            cov = covariance(y_all)
 								            hat_vector = prepare_hat_matrix()
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								            A = W @ hat_vector
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								            P_phi = A @ np.linalg.pinv(A.T @ A) @ A.T
 								            expected_chisquare = np.trace((np.identity(x_all.shape[-1]) - P_phi) @ W @ cov @ W)
 								            output.chisquare_by_expected_chisquare = output.chisquare / expected_chisquare
 								            if not silent:
 								                print('chisquare/expected_chisquare:', output.chisquare_by_expected_chisquare)
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								    fitp = fit_result.x
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    if np.any(np.asarray(dy_f) <= 0.0):
 								        raise Exception('No y errors available, run the gamma method first.')
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    try:
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								        hess = hessian(chisqfunc)(fitp)
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    except TypeError:
 								        raise Exception("It is required to use autograd.numpy instead of numpy within fit functions, see the documentation for details.") from None
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												refactor: logic in least square fits simplified.

Co-authored-by: Simon Kuberski <simon.kuberski@uni-muenster.de>

											
										
										
											2023-03-02 18:39:57 +00:00
+								    def chisqfunc_compact(d):
 								        return anp.sum(general_chisqfunc(d[:n_parms], d[n_parms:]) ** 2)
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    jac_jac_y = hessian(chisqfunc_compact)(np.concatenate((fitp, y_f)))
 								    # Compute hess^{-1} @ jac_jac_y[:n_parms + m, n_parms + m:] using LAPACK dgesv
 								    try:
 								        deriv_y = -scipy.linalg.solve(hess, jac_jac_y[:n_parms, n_parms:])
 								    except np.linalg.LinAlgError:
 								        raise Exception("Cannot invert hessian matrix.")
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    result = []
 								    for i in range(n_parms):
 								        result.append(derived_observable(lambda x_all, **kwargs: (x_all[0] + np.finfo(np.float64).eps) / (y_all[0].value + np.finfo(np.float64).eps) * fitp[i], list(y_all), man_grad=list(deriv_y[i])))
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
+								    output.fit_parameters = result
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								    # Hotelling t-squared p-value for correlated fits.
-												feat/tests: Correlated fits now also work for combined fits.

											
										
										
											2023-02-03 14:54:54 +01:00
+								    if kwargs.get('correlated_fit') is True:
 								        n_cov = np.min(np.vectorize(lambda x_all: x_all.N)(y_all))
 								        output.t2_p_value = 1 - scipy.stats.f.cdf((n_cov - output.dof) / (output.dof * (n_cov - 1)) * output.chisquare,
 								                                                  output.dof, n_cov - output.dof)
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								    if kwargs.get('resplot') is True:
 								        for key in key_ls:
 								            residual_plot(xd[key], yd[key], funcd[key], result, title=key)
 								    if kwargs.get('qqplot') is True:
 								        for key in key_ls:
 								            qqplot(xd[key], yd[key], funcd[key], result, title=key)
-												fix: flak8 & pytest

											
										
										
											2022-12-19 14:03:45 +01:00
+								    return output
-												incorparated (uncorrelated) combined fits in fits.least_squares

											
										
										
											2022-12-16 18:47:25 +01:00
-												total_least_squares docstring updated

											
										
										
											2021-11-08 09:50:51 +00:00
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
def fit_lin(x, y, **kwargs):
    """Performs a linear fit to y = n + m * x and returns two Obs n, m.

    The fit routine is selected from the type of the entries of x: if every
    entry is an Obs the fit is delegated to total_least_squares, if every
    entry is a float or int (or x is a numpy array) it is delegated to
    least_squares. All keyword arguments are forwarded unchanged.

    Parameters
    ----------
    x : list
        Can either be a list of floats in which case no xerror is assumed, or
        a list of Obs, where the dvalues of the Obs are used as xerror for the fit.
    y : list
        List of Obs, the dvalues of the Obs are used as yerror for the fit.

    Returns
    -------
    fit_parameters : list[Obs]
        List of fitted observables.

    Raises
    ------
    Exception
        If the entries of x match none of the supported type patterns.
    """

    def linear_model(params, abscissa):
        # Straight line: params[0] is the intercept n, params[1] the slope m.
        return params[0] + params[1] * abscissa

    # x-values that carry their own errors require the total least squares fit.
    if all(isinstance(entry, Obs) for entry in x):
        return total_least_squares(x, y, linear_model, **kwargs).fit_parameters

    # Plain numbers (or a numpy array) are treated as exact x-values.
    if all(isinstance(entry, (float, int)) for entry in x) or isinstance(x, np.ndarray):
        return least_squares(x, y, linear_model, **kwargs).fit_parameters

    raise Exception('Unsupported types for x')
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
def qqplot(x, o_y, func, p, title=""):
    """Generates a quantile-quantile plot of the fit result which can be used to
       check if the residuals of the fit are gaussian distributed.

    For every pair taken from x and o_y the normalised residual
    (y_i - func(p, x_i)) / y_i.dvalue is formed. The sorted residual values are
    drawn against the theoretical quantiles returned by scipy.stats.probplot,
    together with the identity line and the straight line fitted by probplot.

    Parameters
    ----------
    x : iterable
        x-values, iterated in lockstep with o_y.
    o_y : iterable
        y-values; every element has to provide a dvalue attribute.
    func : callable
        Fit function, evaluated as func(p, x_i).
    p : object
        Fit parameters, handed to func unchanged as its first argument.
    title : str
        Title shown above the legend.

    Returns
    -------
    None
    """

    # Residuals in units of the y error, ordered from smallest to largest.
    normalised = [(obs_y - func(p, x_i)) / obs_y.dvalue for x_i, obs_y in zip(x, o_y)]
    normalised.sort()
    ordered_values = [res.value for res in normalised]

    quantile_fit = scipy.stats.probplot(ordered_values)
    theoretical = quantile_fit[0][0]

    plt.figure(figsize=(8, 8 / 1.618))
    plt.errorbar(theoretical, ordered_values, fmt='o')

    # Sampling grid between the smallest and largest theoretical quantile.
    grid = np.arange(theoretical[0], theoretical[-1], 0.01)
    plt.plot(grid, grid, 'k--', zorder=11, label='Standard normal distribution')

    # quantile_fit[1] holds slope, intercept and correlation coefficient of the line fit.
    slope = quantile_fit[1][0]
    intercept = quantile_fit[1][1]
    fit_label = 'Least squares fit, r=' + str(np.around(quantile_fit[1][2], 3))
    plt.plot(grid, slope * grid + intercept, zorder=10, label=fit_label, marker='', ls='-')

    plt.xlabel('Theoretical quantiles')
    plt.ylabel('Ordered Values')
    plt.legend(title=title)
    plt.draw()
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								def residual_plot(x, y, func, fit_res, title=""):
-												better docstrings (#144)

* first example of returns statement in docstring

* added a some return statements for pandas API

* last return statements in pandas input

* added returns to bdio docstrings

* few returns statements added to docstring

* finished docstrings for hadrons submodule

* also finished docstrings for json submodule

* finished misc submodule

* added returns in docstrings in openqQCD

* made some cosmetic chanes to dostrings

* added return nad return statement in docstring

* linting

* Improved docstrings of mpm, fits, roots, misc to have return statements

returns added for misc.py

returns added for mpm.py

reutrns added for fits.py

* linting...

* Some polishing of docstrings
											
										
										
											2023-01-16 15:57:22 +01:00
+								    """Generates a plot which compares the fit to the data and displays the corresponding residuals
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								    For uncorrelated data the residuals are expected to be distributed ~N(0,1).
-												better docstrings (#144)

* first example of returns statement in docstring

* added a some return statements for pandas API

* last return statements in pandas input

* added returns to bdio docstrings

* few returns statements added to docstring

* finished docstrings for hadrons submodule

* also finished docstrings for json submodule

* finished misc submodule

* added returns in docstrings in openqQCD

* made some cosmetic chanes to dostrings

* added return nad return statement in docstring

* linting

* Improved docstrings of mpm, fits, roots, misc to have return statements

returns added for misc.py

returns added for mpm.py

reutrns added for fits.py

* linting...

* Some polishing of docstrings
											
										
										
											2023-01-16 15:57:22 +01:00
+								    Returns
 								    -------
 								    None
 								    """
-												fix: automatic range of residual_plot improved.

											
										
										
											2022-04-06 16:02:10 +01:00
+								    sorted_x = sorted(x)
 								    xstart = sorted_x[0] - 0.5 * (sorted_x[1] - sorted_x[0])
 								    xstop = sorted_x[-1] + 0.5 * (sorted_x[-1] - sorted_x[-2])
 								    x_samples = np.arange(xstart, xstop + 0.01, 0.01)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								    plt.figure(figsize=(8, 8 / 1.618))
 								    gs = gridspec.GridSpec(2, 1, height_ratios=[3, 1], wspace=0.0, hspace=0.0)
 								    ax0 = plt.subplot(gs[0])
 								    ax0.errorbar(x, [o.value for o in y], yerr=[o.dvalue for o in y], ls='none', fmt='o', capsize=3, markersize=5, label='Data')
-												Examples updated, minor bug fixes

											
										
										
											2021-10-11 18:31:02 +01:00
+								    ax0.plot(x_samples, func([o.value for o in fit_res], x_samples), label='Fit', zorder=10, ls='-', ms=0)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								    ax0.set_xticklabels([])
 								    ax0.set_xlim([xstart, xstop])
 								    ax0.set_xticklabels([])
-												refactor: _standard_fit method made redundant. (#154)

* refactor: _standard_fit method made redundant.

* fix: xs and yz in Corr.fit promoted to arrays.

* fix: x promoted to array in _combined_fit if input is just a list.

* feat: residual_plot and qqplot now work with combined fits with
dictionary inputs.

* tests: test for combined fit resplot and qqplot added.

* docs: docstring of fits.residual_plot extended.
											
										
										
											2023-03-01 10:00:35 +00:00
+								    ax0.legend(title=title)
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								    residuals = (np.asarray([o.value for o in y]) - func([o.value for o in fit_res], x)) / np.asarray([o.dvalue for o in y])
 								    ax1 = plt.subplot(gs[1])
 								    ax1.plot(x, residuals, 'ko', ls='none', markersize=5)
 								    ax1.tick_params(direction='out')
 								    ax1.tick_params(axis="x", bottom=True, top=True, labelbottom=True)
-												fix: removed endpoints in axhline in fits.residual_plot

											
										
										
											2022-01-06 11:56:38 +01:00
+								    ax1.axhline(y=0.0, ls='--', color='k', marker=" ")
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
+								    ax1.fill_between(x_samples, -1.0, 1.0, alpha=0.1, facecolor='k')
 								    ax1.set_xlim([xstart, xstop])
 								    ax1.set_ylabel('Residuals')
 								    plt.subplots_adjust(wspace=None, hspace=None)
-												fix: instances of plot.show changed to plot.draw in fit module

											
										
										
											2021-12-07 08:27:24 +00:00
+								    plt.draw()
-												Initial public release

											
										
										
											2020-10-13 16:53:00 +02:00
 								def error_band(x, func, beta):
 								    """Calculate the error band for an array of sample values x, for given fit function func with optimized parameters beta.

 								    For every sample point the gradient of func with respect to the fit
 								    parameters is evaluated at the central values of beta and contracted
 								    with the covariance matrix of beta, i.e. sqrt(grad @ cov @ grad).

 								    Parameters
 								    ----------
 								    x : iterable
 								        Sample values at which the error band is evaluated.
 								    func : callable
 								        Fit function, called as func(parameters, x_value). It is
 								        differentiated with autograd's elementwise_grad.
 								    beta : list
 								        Optimized fit parameters. Each entry has to provide a `value`
 								        attribute and the list is passed to `covariance`.

 								    Returns
 								    -------
 								    err : np.array
 								        Error band for an array of sample values x, one entry per sample point.
 								        NOTE(review): this was previously documented as np.array(Obs); the
 								        entries are the result of np.sqrt(grad @ cov @ grad), presumably
 								        plain floats -- confirm against the return type of covariance().
 								    """
 								    cov = covariance(beta)
 								    if np.any(np.abs(cov - cov.T) > 1000 * np.finfo(np.float64).eps):
 								        warnings.warn("Covariance matrix is not symmetric within floating point precision", RuntimeWarning)
 								    # Neither the gradient function nor the central values depend on the
 								    # sample point, so they are built once instead of once per iteration.
 								    grad_func = egrad(func)
 								    central_values = [o.value for o in beta]
 								    err = []
 								    for item in x:
 								        deriv = np.array(grad_func(central_values, item))
 								        err.append(np.sqrt(deriv @ cov @ deriv))
 								    return np.array(err)
-												feat: Automated Kolmogorov Smirnov test for fit p-values added

											
										
										
											2022-01-10 15:17:55 +01:00
 								def ks_test(objects=None):
 								    """Performs a Kolmogorov–Smirnov test for the p-values of all fit objects.

 								    The empirical cumulative distribution of the p-values is plotted as a
 								    step function on top of the diagonal, the position with the largest
 								    absolute difference between the two is marked with an arrow and the
 								    result of scipy.stats.kstest against 'uniform' is printed.

 								    Parameters
 								    ----------
 								    objects : list
 								        List of fit results to include in the analysis (optional).
 								        If None, all Fit_result instances currently tracked by the
 								        garbage collector are used.

 								    Returns
 								    -------
 								    None

 								    Raises
 								    ------
 								    ValueError
 								        If there are no fit results to analyse.
 								    """
 								    if objects is None:
 								        obs_list = [obj for obj in gc.get_objects() if isinstance(obj, Fit_result)]
 								    else:
 								        obs_list = objects
 								    p_values = [o.p_value for o in obs_list]
 								    bins = len(p_values)
 								    # Fail early with a clear message: without this check the current
 								    # figure is modified first and np.argmax then raises on an empty array.
 								    if bins == 0:
 								        raise ValueError("No fit results available for the Kolmogorov-Smirnov test.")
 								    x = np.arange(0, 1.001, 0.001)
 								    plt.plot(x, x, 'k', zorder=1)
 								    plt.xlim(0, 1)
 								    plt.ylim(0, 1)
 								    plt.xlabel('p-value')
 								    plt.ylabel('Cumulative probability')
 								    plt.title(str(bins) + ' p-values')
 								    # Heights of the empirical cumulative distribution at the sorted p-values.
 								    n = np.arange(1, bins + 1) / np.float64(bins)
 								    Xs = np.sort(p_values)
 								    plt.step(Xs, n)
 								    diffs = n - Xs
 								    loc_max_diff = np.argmax(np.abs(diffs))
 								    loc = Xs[loc_max_diff]
 								    # Arrow from the diagonal to the step function at the largest difference.
 								    plt.annotate('', xy=(loc, loc), xytext=(loc, loc + diffs[loc_max_diff]), arrowprops=dict(arrowstyle='<->', shrinkA=0, shrinkB=0))
 								    plt.draw()
 								    print(scipy.stats.kstest(p_values, 'uniform'))