scikit-hep · andrzejnovak · Apr 1, 2022 · Apr 1, 2022 · Apr 1, 2022 · Apr 1, 2022
diff --git a/src/uproot/behaviors/TH1.py b/src/uproot/behaviors/TH1.py
@@ -14,6 +14,15 @@
 boost_axis_metadata = {"name": "fName", "label": "fTitle"}
 
 
+def _remove_nan_dims(array):
+    """Return a copy of ``array`` minus every index whose whole slice is NaN."""
+    # Index per axis instead of compressing: a lone NaN/inf in a kept slice stays.
+    dims = range(array.ndim)
+    nan = numpy.isnan(array)
+    keep = [~nan.all(axis=tuple(d for d in dims if d != i)) for i in dims]
+    return array[numpy.ix_(*keep)]
+
+
 def _boost_axis(axis, metadata):
     boost_histogram = uproot.extras.boost_histogram()
 
@@ -245,7 +254,7 @@ def values(self, flow=False):
             self._values = values
 
         if flow:
-            return values
+            return _remove_nan_dims(values)
         else:
             return values[1:-1]
 
@@ -268,7 +277,7 @@ def _values_variances(self, flow):
             self._variances = variances
 
         if flow:
-            return values, variances
+            return _remove_nan_dims(values), _remove_nan_dims(variances)
         else:
             return values[1:-1], variances[1:-1]
 

diff --git a/src/uproot/behaviors/TH2.py b/src/uproot/behaviors/TH2.py
@@ -9,7 +9,7 @@
 import numpy
 
 import uproot
-from uproot.behaviors.TH1 import boost_axis_metadata, boost_metadata
+from uproot.behaviors.TH1 import _remove_nan_dims, boost_axis_metadata, boost_metadata
 
 
 class TH2(uproot.behaviors.TH1.Histogram):
@@ -53,7 +53,7 @@ def values(self, flow=False):
             self._values = values
 
         if flow:
-            return values
+            return _remove_nan_dims(values)
         else:
             return values[1:-1, 1:-1]
 
@@ -76,7 +76,7 @@ def _values_variances(self, flow):
             self._variances = variances
 
         if flow:
-            return values, variances
+            return _remove_nan_dims(values), _remove_nan_dims(variances)
         else:
             return values[1:-1, 1:-1], variances[1:-1, 1:-1]
 

diff --git a/src/uproot/behaviors/TH3.py b/src/uproot/behaviors/TH3.py
@@ -9,7 +9,7 @@
 import numpy
 
 import uproot
-from uproot.behaviors.TH1 import boost_axis_metadata, boost_metadata
+from uproot.behaviors.TH1 import _remove_nan_dims, boost_axis_metadata, boost_metadata
 
 
 class TH3(uproot.behaviors.TH1.Histogram):
@@ -61,7 +61,8 @@ def values(self, flow=False):
             self._values = values
 
         if flow:
-            return values
+            # drop slices that are entirely NaN, e.g. NaN-padded flow bins
+            return _remove_nan_dims(values)
         else:
             return values[1:-1, 1:-1, 1:-1]
 
@@ -84,7 +85,7 @@ def _values_variances(self, flow):
             self._variances = variances
 
         if flow:
-            return values, variances
+            return _remove_nan_dims(values), _remove_nan_dims(variances)
         else:
             return values[1:-1, 1:-1, 1:-1], variances[1:-1, 1:-1, 1:-1]
 

diff --git a/src/uproot/writing/identify.py b/src/uproot/writing/identify.py
@@ -262,6 +262,20 @@ def to_writable(obj):
             # using flow=True if supported
             data = obj.values(flow=True)
             fSumw2 = obj.variances(flow=True)
+            # pad absent under/overflow bins with NaN so every axis has both
+            pad_dim = numpy.array(
+                [
+                    [1 - int(axis.traits.underflow) for axis in obj.axes],
+                    [1 - int(axis.traits.overflow) for axis in obj.axes],
+                ]
+            ).T
+            if numpy.sum(pad_dim) != 0:
+                data = numpy.pad(
+                    data, pad_dim, mode="constant", constant_values=numpy.nan
+                )
+                fSumw2 = numpy.pad(
+                    fSumw2, pad_dim, mode="constant", constant_values=numpy.nan
+                )
 
         except TypeError:
             # flow=True is not supported, fallback to allocate-and-fill
@@ -303,6 +317,12 @@ def to_writable(obj):
         # we're assuming the PlottableHistogram ensures data.shape == weights.shape
         assert data.shape == fSumw2.shape
 
+        # check values/bins dimensions
+        if ndim == 1:
+            assert len(data) == len(obj.axes[0].edges) + 1
+        else:
+            assert data.shape == tuple(len(axis.edges) + 1 for axis in obj.axes)
+
         # data are stored in transposed order for 2D and 3D
         data = data.T.reshape(-1)
         fSumw2 = fSumw2.T.reshape(-1)

diff --git a/tests/test_0422-hist-integration.py b/tests/test_0422-hist-integration.py
@@ -157,3 +157,53 @@ def test_regular_3d(tmp_path):
     assert h2.GetBinContent(8, 9, 2) == 0
     assert h2.GetBinContent(9, 8, 1) == 0
     f.Close()
+
+
+@pytest.mark.parametrize("overflow", [True, False])
+@pytest.mark.parametrize("underflow", [True, False])
+def test_flow_bin_writing(tmp_path, underflow, overflow):
+    """Round-trip a 1D weighted hist through ROOT for every flow-bin setting."""
+    axis = {"name": "x", "underflow": underflow, "overflow": overflow}
+    written = hist.new.Reg(3, 1, 4, **axis).Weight().fill([0, 1, 2, 3, 4])
+    path = os.path.join(tmp_path, "newfile.root")
+
+    # write the histogram, then reopen the file and read it back
+    with uproot.recreate(path) as fout:
+        fout["h1"] = written
+
+    with uproot.open(path) as fin:
+        read_back = fin["h1"]
+
+    # compare the in-range bins first, then the view that includes flow bins
+    for flow in (False, True):
+        assert np.allclose(written.values(flow=flow), read_back.values(flow=flow))
+
+
+@pytest.mark.parametrize("under1", [True, False])
+@pytest.mark.parametrize("under2", [True, False])
+@pytest.mark.parametrize("under3", [True, False])
+@pytest.mark.parametrize("over1", [True, False])
+@pytest.mark.parametrize("over2", [True, False])
+@pytest.mark.parametrize("over3", [True, False])
+def test_flow_bin_writing_3d(tmp_path, under1, under2, under3, over1, over2, over3):
+    """Round-trip a 3D weighted hist through ROOT for every flow-bin setting."""
+    path = os.path.join(tmp_path, "newfile.root")
+    coords = [0, 1, 2, 3, 4]
+    # one regular axis per dimension, each with its own under/overflow switches
+    builder = hist.Hist.new
+    for name, under, over in (
+        ("x", under1, over1),
+        ("y", under2, over2),
+        ("z", under3, over3),
+    ):
+        builder = builder.Reg(3, 1, 4, name=name, underflow=under, overflow=over)
+    written = builder.Weight().fill(coords, coords, coords)
+
+    with uproot.recreate(path) as fout:
+        fout["h1"] = written
+
+    with uproot.open(path) as fin:
+        read_back = fin["h1"]
+
+    for flow in (False, True):
+        assert np.allclose(written.values(flow=flow), read_back.values(flow=flow))