Refined covobs implementation

Simon Kuberski 2021-11-30 11:08:30 +01:00
parent 9db709a171
commit 950fb17c84
2 changed files with 196 additions and 147 deletions

View file

@@ -38,11 +38,11 @@ class Obs:
Dictionary for N_sigma values. If an entry for a given ensemble exists
this overwrites the standard value for that ensemble.
"""
#__slots__ = ['names', 'shape', 'r_values', 'deltas', 'N', '_value', '_dvalue',
# 'ddvalue', 'reweighted', 'S', 'tau_exp', 'N_sigma',
# 'e_dvalue', 'e_ddvalue', 'e_tauint', 'e_dtauint',
# 'e_windowsize', 'e_rho', 'e_drho', 'e_n_tauint', 'e_n_dtauint',
# 'idl', 'is_merged', 'tag', '__dict__']
__slots__ = ['names', 'shape', 'r_values', 'deltas', 'N', '_value', '_dvalue',
'ddvalue', 'reweighted', 'S', 'tau_exp', 'N_sigma',
'e_dvalue', 'e_ddvalue', 'e_tauint', 'e_dtauint',
'e_windowsize', 'e_rho', 'e_drho', 'e_n_tauint', 'e_n_dtauint',
'idl', 'is_merged', 'tag', 'covobs', '__dict__']
S_global = 2.0
S_dict = {}
@@ -68,7 +68,7 @@ class Obs:
already subtracted from the samples
"""
if means is None and not kwargs.get('empty', False):
if means is None and samples is not None:
if len(samples) != len(names):
raise Exception('Length of samples and names incompatible.')
if idl is not None:
@@ -81,10 +81,10 @@ class Obs:
if min(len(x) for x in samples) <= 4:
raise Exception('Samples have to have at least 5 entries.')
if kwargs.get('empty', False):
self.names = []
else:
if names:
self.names = sorted(names)
else:
self.names = []
self.shape = {}
self.r_values = {}
@@ -95,7 +95,7 @@ class Obs:
self.covobs = covobs
self.idl = {}
if not kwargs.get('empty', False):
if samples is not None:
if idl is not None:
for name, idx in sorted(zip(names, idl)):
if isinstance(idx, range):
@@ -159,6 +159,14 @@ class Obs:
def e_names(self):
return sorted(set([o.split('|')[0] for o in self.names]))
@property
def cov_names(self):
return sorted(set([o for o in self.covobs.keys()]))
@property
def mc_names(self):
return sorted(set([o.split('|')[0] for o in self.names if o not in self.cov_names]))
@property
def e_content(self):
res = {}
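The new cov_names and mc_names properties split e_names into Monte Carlo ensembles and Covobs identifiers. A minimal sketch of how the split looks on a derived Obs, assuming the pyerrors API of this commit (the ensemble name 'ensembleA' and the covobs name 'Z_factor' are made up):

import numpy as np
import pyerrors as pe

stat = pe.Obs([np.random.normal(1.0, 0.1, 500)], ['ensembleA'])  # Monte Carlo samples
syst = pe.cov_Obs(1.0, 0.02 ** 2, 'Z_factor')                    # Covobs with variance 0.02**2

prod = stat * syst
print(prod.mc_names)   # ['ensembleA']  -> Monte Carlo ensembles only
print(prod.cov_names)  # ['Z_factor']   -> covobs identifiers only
print(prod.e_names)    # both names, as before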
@@ -233,8 +241,7 @@ class Obs:
_parse_kwarg('tau_exp')
_parse_kwarg('N_sigma')
for e, e_name in enumerate(self.e_names):
if e_name not in self.covobs:
for e, e_name in enumerate(self.mc_names):
r_length = []
for r_name in e_content[e_name]:
if isinstance(self.idl[r_name], range):
@@ -320,7 +327,7 @@ class Obs:
self._dvalue += self.e_dvalue[e_name] ** 2
self.ddvalue += (self.e_dvalue[e_name] * self.e_ddvalue[e_name]) ** 2
else:
for e_name in self.cov_names:
self.e_dvalue[e_name] = np.sqrt(self.covobs[e_name].errsq())
self.e_ddvalue[e_name] = 0
self._dvalue += self.e_dvalue[e_name]**2
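Within gamma_method each covobs now contributes sqrt(grad^T cov grad) via Covobs.errsq(), added in quadrature to the Monte Carlo errors. A hedged consistency check along those lines (synthetic data, names 'ens1' and 'normalization' made up):

import numpy as np
import pyerrors as pe

stat = pe.Obs([np.random.normal(0.5, 0.05, 1000)], ['ens1'])
norm = pe.cov_Obs(1.0, 0.02 ** 2, 'normalization')
prod = stat * norm
prod.gamma_method()
# total error = statistical and covobs contributions combined in quadrature
combined = np.sqrt(prod.e_dvalue['ens1'] ** 2 + prod.e_dvalue['normalization'] ** 2)
assert np.isclose(prod.dvalue, combined)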
@@ -385,15 +392,14 @@ class Obs:
print('Result\t %3.8e +/- %3.8e +/- %3.8e (%3.3f%%)' % (self.value, self.dvalue, self.ddvalue, percentage))
if len(self.e_names) > 1:
print(' Ensemble errors:')
for e_name in self.e_names:
if e_name not in self.covobs:
for e_name in self.mc_names:
if len(self.e_names) > 1:
print('', e_name, '\t %3.8e +/- %3.8e' % (self.e_dvalue[e_name], self.e_ddvalue[e_name]))
if self.tau_exp[e_name] > 0:
print(' t_int\t %3.8e +/- %3.8e tau_exp = %3.2f, N_sigma = %1.0i' % (self.e_tauint[e_name], self.e_dtauint[e_name], self.tau_exp[e_name], self.N_sigma[e_name]))
else:
print(' t_int\t %3.8e +/- %3.8e S = %3.2f' % (self.e_tauint[e_name], self.e_dtauint[e_name], self.S[e_name]))
else:
for e_name in self.cov_names:
print('', e_name, '\t %3.8e' % (self.e_dvalue[e_name]))
if ens_content is True:
if len(self.e_names) == 1:
@@ -467,7 +473,7 @@ class Obs:
raise Exception('Run the gamma method first.')
fig = plt.figure()
for e, e_name in enumerate(self.e_names):
for e, e_name in enumerate(self.mc_names):
plt.xlabel(r'$W$')
plt.ylabel(r'$\tau_\mathrm{int}$')
length = int(len(self.e_n_tauint[e_name]))
@@ -498,7 +504,7 @@ class Obs:
"""Plot normalized autocorrelation function time for each ensemble."""
if not hasattr(self, 'e_dvalue'):
raise Exception('Run the gamma method first.')
for e, e_name in enumerate(self.e_names):
for e, e_name in enumerate(self.mc_names):
plt.xlabel('W')
plt.ylabel('rho')
length = int(len(self.e_drho[e_name]))
@@ -520,7 +526,7 @@ class Obs:
"""Plot replica distribution for each ensemble with more than one replicum."""
if not hasattr(self, 'e_dvalue'):
raise Exception('Run the gamma method first.')
for e, e_name in enumerate(self.e_names):
for e, e_name in enumerate(self.mc_names):
if len(self.e_content[e_name]) == 1:
print('No replica distribution for a single replicum (', e_name, ')')
continue
@@ -546,7 +552,7 @@ class Obs:
expand : bool
show expanded history for irregular Monte Carlo chains (default: True).
"""
for e, e_name in enumerate(self.e_names):
for e, e_name in enumerate(self.mc_names):
plt.figure()
r_length = []
tmp = []
@@ -1055,7 +1061,7 @@ def derived_observable(func, data, **kwargs):
allcov = {}
for o in raveled_data:
for name in o.covobs:
for name in o.cov_names:
if name in allcov:
if not np.array_equal(allcov[name], o.covobs[name].cov):
raise Exception('Inconsistent covariance matrices for %s!' % (name))
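derived_observable collects every covariance matrix by name, so two Obs whose covobs share an identifier but not a matrix cannot be combined. A sketch of the expected failure, assuming cov_Obs as introduced in this commit (the name 'syst' is made up):

import pyerrors as pe

a = pe.cov_Obs(1.0, 0.01, 'syst')
b = pe.cov_Obs(2.0, 0.04, 'syst')  # same identifier, different covariance
try:
    _ = a + b                      # goes through derived_observable
except Exception as err:
    print(err)                     # expected: Inconsistent covariance matrices for syst!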
@@ -1137,7 +1143,7 @@ def derived_observable(func, data, **kwargs):
new_grad = {}
for j_obs, obs in np.ndenumerate(data):
for name in obs.names:
if name in obs.covobs:
if name in obs.cov_names:
if name in new_grad:
new_grad[name] += deriv[i_val + j_obs] * obs.covobs[name].grad
else:
@@ -1231,6 +1237,8 @@ def reweight(weight, obs, **kwargs):
"""
result = []
for i in range(len(obs)):
if len(obs[i].cov_names):
raise Exception('Error: Not possible to reweight an Obs that contains covobs!')
if sorted(weight.names) != sorted(obs[i].names):
raise Exception('Error: Ensembles do not fit')
for name in weight.names:
@@ -1272,6 +1280,8 @@ def correlate(obs_a, obs_b):
if sorted(obs_a.names) != sorted(obs_b.names):
raise Exception('Ensembles do not fit')
if len(obs_a.cov_names) or len(obs_b.cov_names):
raise Exception('Error: Not possible to correlate Obs that contain covobs!')
for name in obs_a.names:
if obs_a.shape[name] != obs_b.shape[name]:
raise Exception('Shapes of ensemble', name, 'do not fit')
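reweight and correlate now reject Obs that carry covobs, since a Covobs has no configurations to reweight or correlate. A short sketch of the guard in action (names made up; assumes reweight is exposed at package level):

import numpy as np
import pyerrors as pe

w = pe.Obs([np.random.normal(1.0, 0.01, 500)], ['ensA'])  # weight factor
o = pe.Obs([np.random.normal(0.3, 0.02, 500)], ['ensA']) * pe.cov_Obs(1.0, 1e-4, 'syst')
try:
    pe.reweight(w, [o])
except Exception as err:
    print(err)  # expected: Error: Not possible to reweight an Obs that contains covobs!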
@@ -1329,7 +1339,7 @@ def covariance(obs1, obs2, correlation=False, **kwargs):
dvalue = 0
for e_name in obs1.e_names:
for e_name in obs1.mc_names:
if e_name not in obs2.e_names:
continue
@@ -1349,6 +1359,13 @@ def covariance(obs1, obs2, correlation=False, **kwargs):
tau_combined = (obs1.e_tauint[e_name] + obs2.e_tauint[e_name]) / 2
dvalue += gamma / e_N * (1 + 1 / e_N) / e_N * 2 * tau_combined
for e_name in obs1.cov_names:
if e_name not in obs2.cov_names:
continue
dvalue += float(np.dot(np.transpose(obs1.covobs[e_name].grad), np.dot(obs1.covobs[e_name].cov, obs2.covobs[e_name].grad)))
if np.abs(dvalue / obs1.dvalue / obs2.dvalue) > 1.0:
dvalue = np.sign(dvalue) * obs1.dvalue * obs2.dvalue
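For a shared covobs name the covariance picks up grad1^T cov grad2. For two entries of one cov_Obs list the gradients are unit vectors, so this reduces to the corresponding matrix element, as the new test below also checks. A hedged sketch with made-up numbers:

import numpy as np
import pyerrors as pe

cov = [[0.3, -0.1], [-0.1, 0.5]]
a, b = pe.cov_Obs([1.0, 2.0], cov, 'syst')
a.gamma_method()
b.gamma_method()
# grad_a = (1, 0), grad_b = (0, 1)  =>  grad_a^T C grad_b = cov[0][1]
assert np.isclose(pe.covariance(a, b), cov[0][1])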
@@ -1420,9 +1437,9 @@ def covariance2(obs1, obs2, correlation=False, **kwargs):
e_n_tauint = {}
e_rho = {}
for e_name in obs1.e_names:
for e_name in obs1.mc_names:
if e_name not in obs2.e_names:
if e_name not in obs2.mc_names:
continue
idl_d = {}
@@ -1473,6 +1490,13 @@ def covariance2(obs1, obs2, correlation=False, **kwargs):
dvalue += e_dvalue[e_name]
for e_name in obs1.cov_names:
if e_name not in obs2.cov_names:
continue
dvalue += float(np.dot(np.transpose(obs1.covobs[e_name].grad), np.dot(obs1.covobs[e_name].cov, obs2.covobs[e_name].grad)))
if np.abs(dvalue / obs1.dvalue / obs2.dvalue) > 1.0:
dvalue = np.sign(dvalue) * obs1.dvalue * obs2.dvalue
@@ -1610,6 +1634,8 @@ def merge_obs(list_of_obs):
replist = [item for obs in list_of_obs for item in obs.names]
if (len(replist) == len(set(replist))) is False:
raise Exception('list_of_obs contains duplicate replica: %s' % (str(replist)))
if any([len(o.cov_names) for o in list_of_obs]):
raise Exception('Not possible to merge data that contains covobs!')
new_dict = {}
idl_dict = {}
for o in list_of_obs:
@@ -1624,6 +1650,21 @@ def merge_obs(list_of_obs):
return o
def cov_Obs(means, cov, name, grad=None):
"""Create an Obs based on mean(s) and a covariance matrix
Parameters
----------
means : list of floats or float
N mean value(s) of the new Obs
cov : list or array
2d (NxN) Covariance matrix, 1d diagonal entries or 0d covariance
name : str
identifier for the covariance matrix
grad : list or array
Gradient of the Covobs wrt. the means belonging to cov.
"""
def covobs_to_obs(co):
"""Make an Obs out of a Covobs
@@ -1641,44 +1682,14 @@ def covobs_to_obs(co):
o.idl[co.name] = []
return o
def create_Covobs(mean, cov, name, pos=None, grad=None):
"""Make an Obs based on a Covobs
Parameters
----------
mean : float
Mean value of the new Obs
cov : list or array
2d Covariance matrix or 1d diagonal entries
name : str
identifier for the covariance matrix
pos : int
Position of the variance belonging to mean in cov.
Is taken to be 1 if cov is 0-dimensional
grad : list or array
Gradient of the Covobs wrt. the means belonging to cov.
"""
return covobs_to_obs(Covobs(mean, cov, name, pos=pos, grad=grad))
def create_Covobs_list(means, cov, name, grad=None):
"""Make a list of Obs based Covobs
Parameters
----------
mean : list of floats
N mean values of the new Obs
cov : list or array
2d (NxN) Covariance matrix or 1d diagonal entries
name : str
identifier for the covariance matrix
grad : list or array
Gradient of the Covobs wrt. the means belonging to cov.
"""
ol = []
if isinstance(means, (float, int)):
means = [means]
for i in range(len(means)):
ol.append(covobs_to_obs(Covobs(means[i], cov, name, pos=i, grad=grad)))
if ol[0].covobs[name].N != len(means):
raise Exception('You have to provide %d mean values!' % (ol[0].N))
if len(ol) == 1:
return ol[0]
return ol
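cov_Obs merges the former create_Covobs and create_Covobs_list helpers: a scalar mean with a 0d covariance yields a single Obs, a list of means with an NxN matrix yields a list of Obs sharing one Covobs. A hedged usage sketch (values and names illustrative):

import numpy as np
import pyerrors as pe

single = pe.cov_Obs(1.05, 0.02 ** 2, 'Z_scalar')  # one mean, 0d covariance (a variance)
single.gamma_method()
assert np.isclose(single.dvalue, 0.02)

pair = pe.cov_Obs([0.7, -1.3], [[0.04, -0.01], [-0.01, 0.09]], 'LECs')
assert len(pair) == 2
assert pair[0].covobs['LECs'].N == 2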

View file

@@ -543,3 +543,41 @@ def test_import_jackknife():
reconstructed_obs = pe.import_jackknife(my_jacks, 'test')
assert my_obs == reconstructed_obs
def test_covobs():
val = 1.123124
cov = .243423
name = 'Covariance'
co = pe.cov_Obs(val, cov, name)
co.gamma_method()
assert (co.dvalue == np.sqrt(cov))
assert (co.value == val)
do = 2 * co
assert (do.covobs[name].grad[0] == 2)
do = co * co
assert (do.covobs[name].grad[0] == 2 * val)
assert np.array_equal(do.covobs[name].cov, co.covobs[name].cov)
pi = [16.7457, -19.0475]
cov = [[3.49591, -6.07560], [-6.07560, 10.5834]]
cl = pe.cov_Obs(pi, cov, 'rAP')
pl = pe.misc.gen_correlated_data(pi, np.asarray(cov), 'rAPpseudo')
def rAP(p, g0sq):
return -0.0010666 * g0sq * (1 + np.exp(p[0] + p[1] / g0sq))
for g0sq in [1, 1.5, 1.8]:
oc = rAP(cl, g0sq)
oc.gamma_method()
op = rAP(pl, g0sq)
op.gamma_method()
assert(np.isclose(oc.value, op.value, rtol=1e-14, atol=1e-14))
assert(pe.covariance(cl[0], cl[1]) == cov[0][1])
assert(pe.covariance2(cl[0], cl[1]) == cov[1][0])
do = cl[0] * cl[1]
assert(np.array_equal(do.covobs['rAP'].grad, np.transpose([pi[1], pi[0]]).reshape(2, 1)))