lsst-sitcom · erykoff · Nov 27, 2023 · Nov 22, 2023 · Nov 27, 2023
diff --git a/python/lsst/summit/utils/utils.py b/python/lsst/summit/utils/utils.py
@@ -1011,8 +1011,10 @@ def getQuantiles(data, nColors):
     if np.isnan(minVal):  # cdf calculation has failed because all data is nan
         return np.asarray([np.nan for _ in range(nColors)])
 
+    scale = (maxVal - minVal)/len(cdf)
+
     boundaries = np.asarray(
-        [np.argmax(cdf >= i) + minVal for i in range(nColors)] + [maxVal]
+        [np.argmax(cdf >= i)*scale + minVal for i in range(nColors)] + [maxVal]
     )
     return boundaries
 
@@ -1034,5 +1036,6 @@ def digitizeData(data, nColors=256):
         Scaled data in the [0, nColors - 1] range.
     """
     cdf, minVal, maxVal = getCdf(data, nColors - 1)
-    bins = np.floor((data - minVal)).astype(np.int64)
+    scale = (maxVal - minVal)/len(cdf)
+    bins = np.floor((data*scale - minVal)).astype(np.int64)
     return cdf[bins]
diff --git a/tests/test_utils.py b/tests/test_utils.py
@@ -233,8 +233,7 @@ def test_quantiles(self):
         # We understand that our algorithm gives very large rounding error
         # compared to the generic numpy method. But still test it.
         np.random.seed(1234)
-        # too big of a width violates the tolerance in the test to cap at 10k
-        dataRanges = [(50, 1, -1), (100_000, 5_000, -1), (5_000_000, 10_000, -2)]
+        dataRanges = [(50, 1, -1), (100_000, 5_000, -2), (5_000_000, 10_000, -2), (50_000, 100_000, -3)]
         colorRanges = [2, 256, 999]  # [very few, nominal, lots and an odd number]
         for nColors, (mean, width, decimal) in itertools.product(colorRanges, dataRanges):
             data = np.random.normal(mean, width, (100, 100))