From cb31e681b8ee73f77fa5146127f7d1e7b9698940 Mon Sep 17 00:00:00 2001
From: Fabian Joswig <fabian.joswig@ed.ac.uk>
Date: Tue, 31 Jan 2023 17:44:49 +0000
Subject: [PATCH 1/9] fix: rescaled incomplete measurements.

---
 pyerrors/obs.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pyerrors/obs.py b/pyerrors/obs.py
index 9df6b5c2..713cae0b 100644
--- a/pyerrors/obs.py
+++ b/pyerrors/obs.py
@@ -1097,7 +1097,7 @@ def _expand_deltas_for_merge(deltas, idx, shape, new_idx):
     ret = np.zeros(new_idx[-1] - new_idx[0] + 1)
     for i in range(shape):
         ret[idx[i] - new_idx[0]] = deltas[i]
-    return np.array([ret[new_idx[i] - new_idx[0]] for i in range(len(new_idx))])
+    return np.array([ret[new_idx[i] - new_idx[0]] for i in range(len(new_idx))]) * len(new_idx) / len(idx)
 
 
 def derived_observable(func, data, array_mode=False, **kwargs):

From 2e490e56f4bcf6fb143b1409468029cf1a716470 Mon Sep 17 00:00:00 2001
From: Fabian Joswig <fabian.joswig@ed.ac.uk>
Date: Thu, 2 Feb 2023 13:35:08 +0000
Subject: [PATCH 2/9] fix: fixed test intersection reduce.

---
 tests/obs_test.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/obs_test.py b/tests/obs_test.py
index b01ed034..7f76a15f 100644
--- a/tests/obs_test.py
+++ b/tests/obs_test.py
@@ -566,7 +566,7 @@ def test_intersection_reduce():
     intersection = pe.obs._intersection_idx([o.idl["ens"] for o in [obs1, obs_merge]])
     coll = pe.obs._reduce_deltas(obs_merge.deltas["ens"], obs_merge.idl["ens"], range1)
 
-    assert np.all(coll == obs1.deltas["ens"])
+    assert np.allclose(coll, obs1.deltas["ens"] * (len(obs_merge.idl["ens"]) / len(range1)))
 
 
 def test_irregular_error_propagation():

From b3d030abf3a0e9c5a67daacc94511b12dd66a43f Mon Sep 17 00:00:00 2001
From: Fabian Joswig <fabian.joswig@ed.ac.uk>
Date: Thu, 2 Feb 2023 13:42:15 +0000
Subject: [PATCH 3/9] fix: fixed test_correlation_intersection_of_idls

---
 tests/obs_test.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/obs_test.py b/tests/obs_test.py
index 7f76a15f..4d84be63 100644
--- a/tests/obs_test.py
+++ b/tests/obs_test.py
@@ -878,7 +878,7 @@ def test_correlation_intersection_of_idls():
     cov1 = pe.covariance([obs1, obs2_a])
     corr1 = pe.covariance([obs1, obs2_a], correlation=True)
 
-    obs2_b = obs2_a + pe.Obs([np.random.normal(1.0, 0.1, len(range2))], ["ens"], idl=[range2])
+    obs2_b = (obs2_a + pe.Obs([np.random.normal(1.0, 0.1, len(range2))], ["ens"], idl=[range2])) / 2
     obs2_b.gamma_method()
 
     cov2 = pe.covariance([obs1, obs2_b])

From f6df9d02f5b0b3c4b571702ff324c87565b93e34 Mon Sep 17 00:00:00 2001
From: Fabian Joswig <fabian.joswig@ed.ac.uk>
Date: Thu, 2 Feb 2023 13:49:40 +0000
Subject: [PATCH 4/9] test: added additional tests for non-overlapping
 configurations.

---
 tests/obs_test.py | 53 +++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 53 insertions(+)

diff --git a/tests/obs_test.py b/tests/obs_test.py
index 4d84be63..bb93538f 100644
--- a/tests/obs_test.py
+++ b/tests/obs_test.py
@@ -1038,6 +1038,7 @@ def test_hash():
     assert hash(obs) != hash(o1)
     assert hash(o1) != hash(o2)
 
+
 def test_gm_alias():
     samples = np.random.rand(500)
 
@@ -1049,3 +1050,55 @@ def test_gm_alias():
 
     assert np.isclose(tt1.dvalue, tt2.dvalue)
 
+
+def test_overlapping_missing_cnfgs():
+    length = 200000
+
+    l_samp = np.random.normal(2.87, 0.5, length)
+    s_samp = np.random.normal(7.87, 0.7, length // 2)
+
+    o1 = pe.Obs([l_samp], ["test"])
+    o2 = pe.Obs([s_samp], ["test"], idl=[range(1, length, 2)])
+
+    a2 = pe.Obs([s_samp], ["alt"])
+    t1 = o1 + o2
+    t1.gm(S=0)
+
+    t2 = o1 + a2
+    t2.gm(S=0)
+    assert np.isclose(t1.dvalue, t2.dvalue, rtol=0.01)
+
+
+def test_non_overlapping_missing_cnfgs():
+    length = 100000
+
+    xsamp = np.random.normal(1.0, 1.0, length)
+
+
+    full = pe.Obs([xsamp], ["ensemble"], idl=[range(0, length)])
+    full.gm()
+
+    even = pe.Obs([xsamp[0:length:2]], ["ensemble"], idl=[range(0, length, 2)])
+    odd = pe.Obs([xsamp[1:length:2]], ["ensemble"], idl=[range(1, length, 2)])
+
+    average = (even + odd) / 2
+    average.gm(S=0)
+    assert np.isclose(full.dvalue, average.dvalue, rtol=0.01)
+
+
+def test_non_overlapping_product():
+    length = 100000
+
+    samples = np.random.normal(0.93, 0.5, length)
+
+    e = pe.Obs([samples[0:length:2]], ["ensemble"], idl=[range(0, length, 2)])
+    o = pe.Obs([samples[1:length:2]], ["ensemble"], idl=[range(1, length, 2)])
+    prod1 = e * o
+    prod1.gm(S=0)
+
+    e2 = pe.Obs([samples[0:length:2]], ["even"])
+    o2 = pe.Obs([samples[1:length:2]], ["odd"])
+    prod2 = e2 * o2
+    prod2.gm(S=0)
+
+    assert np.isclose(prod1.dvalue, prod2.dvalue, rtol=0.01)

From 79d185aa7d039a9c40a681edb9be647b1edaeb86 Mon Sep 17 00:00:00 2001
From: Fabian Joswig <fabian.joswig@ed.ac.uk>
Date: Thu, 2 Feb 2023 13:57:58 +0000
Subject: [PATCH 5/9] test: non_overlapping tests refined.

---
 tests/obs_test.py | 23 +++++++++++++++++------
 1 file changed, 17 insertions(+), 6 deletions(-)

diff --git a/tests/obs_test.py b/tests/obs_test.py
index bb93538f..92002c2b 100644
--- a/tests/obs_test.py
+++ b/tests/obs_test.py
@@ -1086,19 +1086,30 @@ def test_non_overlapping_missing_cnfgs():
     assert np.isclose(full.dvalue, average.dvalue, rtol=0.01)
 
 
-def test_non_overlapping_product():
+def test_non_overlapping_operations():
     length = 100000
 
     samples = np.random.normal(0.93, 0.5, length)
 
     e = pe.Obs([samples[0:length:2]], ["ensemble"], idl=[range(0, length, 2)])
     o = pe.Obs([samples[1:length:2]], ["ensemble"], idl=[range(1, length, 2)])
-    prod1 = e * o
-    prod1.gm(S=0)
+
 
     e2 = pe.Obs([samples[0:length:2]], ["even"])
     o2 = pe.Obs([samples[1:length:2]], ["odd"])
-    prod2 = e2 * o2
-    prod2.gm(S=0)
 
-    assert np.isclose(prod1.dvalue, prod2.dvalue, rtol=0.01)
+    for func in  [lambda a, b: a + b,
+                  lambda a, b: a - b,
+                  lambda a, b: a * b,
+                  lambda a, b: a / b,
+                  lambda a, b: a ** b]:
+
+        res1 = func(e, o)
+        res1.gm(S=0)
+        res2 = func(e2, o2)
+        res2.gm(S=0)
+
+        print(res1, res2)
+        print((res1.dvalue - res2.dvalue) / res1.dvalue)
+
+        assert np.isclose(res1.dvalue, res2.dvalue, rtol=0.01)

From e34d49d88d579879ddffb424fe218d6284252e9b Mon Sep 17 00:00:00 2001
From: Fabian Joswig <fabian.joswig@ed.ac.uk>
Date: Thu, 2 Feb 2023 14:19:16 +0000
Subject: [PATCH 6/9] test: additional test for non overlapping configurations
 added.

---
 tests/obs_test.py | 29 +++++++++++++++++++++++++++++
 1 file changed, 29 insertions(+)

diff --git a/tests/obs_test.py b/tests/obs_test.py
index 92002c2b..650045b9 100644
--- a/tests/obs_test.py
+++ b/tests/obs_test.py
@@ -1113,3 +1113,32 @@ def test_non_overlapping_operations():
         print((res1.dvalue - res2.dvalue) / res1.dvalue)
 
         assert np.isclose(res1.dvalue, res2.dvalue, rtol=0.01)
+
+
+def test_non_overlapping_operations_different_lengths():
+    length = 100000
+
+    samples = np.random.normal(0.93, 0.5, length)
+    first = samples[:length // 5]
+    second = samples[length // 5:]
+
+    f1 = pe.Obs([first], ["ensemble"], idl=[range(1, length // 5 + 1)])
+    s1 = pe.Obs([second], ["ensemble"], idl=[range(length // 5, length)])
+
+
+    f2 = pe.Obs([first], ["first"])
+    s2 = pe.Obs([second], ["second"])
+
+    for func in  [lambda a, b: a + b,
+                  lambda a, b: a - b,
+                  lambda a, b: a * b,
+                  lambda a, b: a / b,
+                  lambda a, b: a ** b,
+                  lambda a, b: a ** 2 + b ** 2 / a]:
+
+        res1 = func(f1, f1)
+        res1.gm(S=0)
+        res2 = func(f2, f2)
+        res2.gm(S=0)
+
+        assert np.isclose(res1.dvalue, res2.dvalue, rtol=0.01)

From dc5116aa2f6046144ac0f9d27e4c70b8d99d9bce Mon Sep 17 00:00:00 2001
From: Simon Kuberski <simon.kuberski@uni-muenster.de>
Date: Thu, 2 Feb 2023 15:31:46 +0100
Subject: [PATCH 7/9] dobs: Zeros are written if config is not part of the Obs,
 these are ignored on input

---
 pyerrors/input/dobs.py | 51 +++++++++++++++++++++---------------------
 tests/json_io_test.py  |  2 +-
 2 files changed, 27 insertions(+), 26 deletions(-)

diff --git a/pyerrors/input/dobs.py b/pyerrors/input/dobs.py
index bbba2cf0..5acda12b 100644
--- a/pyerrors/input/dobs.py
+++ b/pyerrors/input/dobs.py
@@ -397,7 +397,7 @@ def read_pobs(fname, full_output=False, gz=True, separator_insertion=None):
 
 
 # this is based on Mattia Bruno's implementation at https://github.com/mbruno46/pyobs/blob/master/pyobs/IO/xml.py
-def import_dobs_string(content, noempty=False, full_output=False, separator_insertion=True):
+def import_dobs_string(content, full_output=False, separator_insertion=True):
     """Import a list of Obs from a string in the Zeuthen dobs format.
 
     Tags are not written or recovered automatically.
@@ -406,9 +406,6 @@ def import_dobs_string(content, noempty=False, full_output=False, separator_inse
     ----------
     content : str
         XML string containing the data
-    noemtpy : bool
-        If True, ensembles with no contribution to the Obs are not included.
-        If False, ensembles are included as written in the file, possibly with vanishing entries.
     full_output : bool
         If True, a dict containing auxiliary information and the data is returned.
         If False, only the data is returned as list.
@@ -507,7 +504,11 @@ def import_dobs_string(content, noempty=False, full_output=False, separator_inse
 
     for name in names:
         for i in range(len(deltad[name])):
-            deltad[name][i] = np.array(deltad[name][i]) + mean[i]
+            tmp = np.zeros_like(deltad[name][i])
+            for j in range(len(deltad[name][i])):
+                if deltad[name][i][j] != 0.:
+                    tmp[j] = deltad[name][i][j] + mean[i]
+            deltad[name][i] = tmp
 
     res = []
     for i in range(len(mean)):
@@ -516,11 +517,19 @@ def import_dobs_string(content, noempty=False, full_output=False, separator_inse
         obs_names = []
         for name in names:
             h = np.unique(deltad[name][i])
-            if len(h) == 1 and np.all(h == mean[i]) and noempty:
+            if len(h) == 1 and np.all(h == mean[i]):
                 continue
-            deltas.append(deltad[name][i])
-            obs_names.append(name)
-            idl.append(idld[name])
+            repdeltas = []
+            repidl = []
+            for j in range(len(deltad[name][i])):
+                if deltad[name][i][j] != 0.:
+                    repdeltas.append(deltad[name][i][j])
+                    repidl.append(idld[name][j])
+            if len(repdeltas) > 0:
+                obs_names.append(name)
+                deltas.append(repdeltas)
+                idl.append(repidl)
+
         res.append(Obs(deltas, obs_names, idl=idl))
         res[-1]._value = mean[i]
     _check(len(e_names) == ne)
@@ -528,13 +537,10 @@ def import_dobs_string(content, noempty=False, full_output=False, separator_inse
     cnames = list(covd.keys())
     for i in range(len(res)):
         new_covobs = {name: Covobs(0, covd[name], name, grad=gradd[name][i]) for name in cnames}
-        if noempty:
-            for name in cnames:
-                if np.all(new_covobs[name].grad == 0):
-                    del new_covobs[name]
-            cnames_loc = list(new_covobs.keys())
-        else:
-            cnames_loc = cnames
+        for name in cnames:
+            if np.all(new_covobs[name].grad == 0):
+                del new_covobs[name]
+        cnames_loc = list(new_covobs.keys())
         for name in cnames_loc:
             res[i].names.append(name)
             res[i].shape[name] = 1
@@ -546,8 +552,6 @@ def import_dobs_string(content, noempty=False, full_output=False, separator_inse
             res[i].tag = symbol[i]
             if res[i].tag == 'None':
                 res[i].tag = None
-    if not noempty:
-        _check(len(res[0].covobs.keys()) == nc)
     if full_output:
         retd = {}
         tool = file_origin.get('tool', None)
@@ -568,7 +572,7 @@ def import_dobs_string(content, noempty=False, full_output=False, separator_inse
         return res
 
 
-def read_dobs(fname, noempty=False, full_output=False, gz=True, separator_insertion=True):
+def read_dobs(fname, full_output=False, gz=True, separator_insertion=True):
     """Import a list of Obs from an xml.gz file in the Zeuthen dobs format.
 
     Tags are not written or recovered automatically.
@@ -577,9 +581,6 @@ def read_dobs(fname, noempty=False, full_output=False, gz=True, separator_insert
     ----------
     fname : str
         Filename of the input file.
-    noemtpy : bool
-        If True, ensembles with no contribution to the Obs are not included.
-        If False, ensembles are included as written in the file.
     full_output : bool
         If True, a dict containing auxiliary information and the data is returned.
         If False, only the data is returned as list.
@@ -615,7 +616,7 @@ def read_dobs(fname, noempty=False, full_output=False, gz=True, separator_insert
         with open(fname, 'r') as fin:
             content = fin.read()
 
-    return import_dobs_string(content, noempty, full_output, separator_insertion=separator_insertion)
+    return import_dobs_string(content, full_output, separator_insertion=separator_insertion)
 
 
 def _dobsdict_to_xmlstring(d):
@@ -782,7 +783,7 @@ def create_dobs_string(obsl, name, spec='dobs v1.0', origin='', symbol=[], who=N
                     o = obsl[oi]
                     if repname in o.idl:
                         if counters[oi] < 0:
-                            num = offsets[oi]
+                            num = 0
                             if num == 0:
                                 data += '0 '
                             else:
@@ -798,7 +799,7 @@ def create_dobs_string(obsl, name, spec='dobs v1.0', origin='', symbol=[], who=N
                             if counters[oi] >= len(o.idl[repname]):
                                 counters[oi] = -1
                         else:
-                            num = offsets[oi]
+                            num = 0
                             if num == 0:
                                 data += '0 '
                             else:
diff --git a/tests/json_io_test.py b/tests/json_io_test.py
index a37ba80b..21a70162 100644
--- a/tests/json_io_test.py
+++ b/tests/json_io_test.py
@@ -339,7 +339,7 @@ def test_dobsio():
 
     dobsio.write_dobs(ol, fname, 'TEST')
 
-    rl = dobsio.read_dobs(fname, noempty=True)
+    rl = dobsio.read_dobs(fname)
     os.remove(fname + '.xml.gz')
     [o.gamma_method() for o in rl]
 

From 37b3498258abf08ac87009d46c6f163d539d4b0a Mon Sep 17 00:00:00 2001
From: Fabian Joswig <fabian.joswig@ed.ac.uk>
Date: Thu, 2 Feb 2023 14:38:43 +0000
Subject: [PATCH 8/9] fix: unused variable removed in dobs.py

---
 pyerrors/input/dobs.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/pyerrors/input/dobs.py b/pyerrors/input/dobs.py
index 5acda12b..4757baae 100644
--- a/pyerrors/input/dobs.py
+++ b/pyerrors/input/dobs.py
@@ -454,7 +454,6 @@ def import_dobs_string(content, full_output=False, separator_insertion=True):
     _check(dobs[4].tag == "ne")
     ne = int(dobs[4].text.strip())
     _check(dobs[5].tag == "nc")
-    nc = int(dobs[5].text.strip())
 
     idld = {}
     deltad = {}

From 37c59a198ef57bbd6eb4c7fa6cc0a2b81d5f6389 Mon Sep 17 00:00:00 2001
From: Fabian Joswig <fabian.joswig@ed.ac.uk>
Date: Thu, 2 Feb 2023 15:08:22 +0000
Subject: [PATCH 9/9] test: test for values added to non overlapping tests.

---
 tests/obs_test.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/tests/obs_test.py b/tests/obs_test.py
index 650045b9..4741945a 100644
--- a/tests/obs_test.py
+++ b/tests/obs_test.py
@@ -1066,6 +1066,7 @@ def test_overlapping_missing_cnfgs():
 
     t2 = o1 + a2
     t2.gm(S=0)
+    assert np.isclose(t1.value, t2.value)
     assert np.isclose(t1.dvalue, t2.dvalue, rtol=0.01)
 
 
@@ -1083,6 +1084,7 @@ def test_non_overlapping_missing_cnfgs():
 
     average = (even + odd) / 2
     average.gm(S=0)
+    assert np.isclose(full.value, average.value)
     assert np.isclose(full.dvalue, average.dvalue, rtol=0.01)
 
 
@@ -1112,6 +1114,7 @@ def test_non_overlapping_operations():
         print(res1, res2)
         print((res1.dvalue - res2.dvalue) / res1.dvalue)
 
+        assert np.isclose(res1.value, res2.value)
         assert np.isclose(res1.dvalue, res2.dvalue, rtol=0.01)
 
 
@@ -1141,4 +1144,5 @@ def test_non_overlapping_operations_different_lengths():
         res2 = func(f2, f2)
         res2.gm(S=0)
 
+        assert np.isclose(res1.value, res2.value)
         assert np.isclose(res1.dvalue, res2.dvalue, rtol=0.01)