From 0f29529da946cb662b082c9e34cfdcc8b9d88b74 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Fri, 18 Jul 2025 16:09:04 +1000
Subject: [PATCH 01/54] update to nanvar to use more stable algorithm if engine
 is flox

---
 flox/__init__.py       |   2 -
 flox/_version.py       |   1 +
 flox/aggregate_flox.py | 116 ++++++++++++++++++++++++++++++++++++++++-
 flox/aggregations.py   |  71 +++++++++++++++++++++----
 4 files changed, 178 insertions(+), 12 deletions(-)
 create mode 100644 flox/_version.py

diff --git a/flox/__init__.py b/flox/__init__.py
index 898c10e2..2ed80afc 100644
--- a/flox/__init__.py
+++ b/flox/__init__.py
@@ -13,7 +13,6 @@
     ReindexArrayType,
 )  # noqa
 
-
 def _get_version():
     __version__ = "999"
     try:
@@ -22,5 +21,4 @@ def _get_version():
         pass
     return __version__
 
-
 __version__ = _get_version()
diff --git a/flox/_version.py b/flox/_version.py
new file mode 100644
index 00000000..5b33c8a4
--- /dev/null
+++ b/flox/_version.py
@@ -0,0 +1 @@
+__version__ = "0.1.dev657+g619a390.d20250606"
\ No newline at end of file
diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index e470151a..ea1aa2c1 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -5,6 +5,86 @@
 from . import xrdtypes as dtypes
 from .xrutils import is_scalar, isnull, notnull
 
+MULTIARRAY_HANDLED_FUNCTIONS = {}
+
+class MultiArray:
+    arrays: tuple[np.ndarray, ...]
+
+    def __init__(self, arrays):
+        self.arrays = arrays # something else needed here to be more careful about types (not sure what)
+        # Do we want to co-erce arrays into a tuple and make sure it's immutable? Do we want it to be immutable?
+        assert np.all([arrays[0].shape == a.shape for a in arrays]), 'Expect all arrays to have the same shape'
+        
+    def astype(self,dt,**kwargs):
+        new_arrays = [] # I really don't like doing this as a list
+        for array in self.arrays: # Do we care about trying to avoid for loops here? three separate lines would be faster, but harder to read
+            new_arrays.append(array.astype(dt,**kwargs))
+        return MultiArray(new_arrays)
+    
+    def reshape(self,shape,**kwargs):
+        return MultiArray([array.reshape(shape,**kwargs) for array in self.arrays])
+    
+    def squeeze(self,axis=None):
+        return MultiArray([array.squeeze(axis) for array in self.arrays])    
+    
+    def __array_function__(self, func, types, args, kwargs):
+        if func not in MULTIARRAY_HANDLED_FUNCTIONS:
+            return NotImplemented
+        # Note: this allows subclasses that don't override
+        # __array_function__ to handle MyArray objects
+        #if not all(issubclass(t, MyArray) for t in types): # I can't see this being relevant at all for this code, but maybe it's safer to leave it in?
+            #return NotImplemented
+        return MULTIARRAY_HANDLED_FUNCTIONS[func](*args, **kwargs)    
+
+        
+   # Shape is needed, seems likely that the other two might be
+   # Making some strong assumptions here that all the arrays are the same shape, and I don't really like this
+    @property
+    def dtype(self) -> np.dtype:
+        return self.arrays[0].dtype
+
+    @property
+    def shape(self) -> tuple[int, ...]:
+        return self.arrays[0].shape
+
+    @property
+    def ndim(self) -> int:
+        return self.arrays[0].ndim
+
+def implements(numpy_function):
+    """Register an __array_function__ implementation for MyArray objects."""
+    def decorator(func):
+        MULTIARRAY_HANDLED_FUNCTIONS[numpy_function] = func
+        return func
+    return decorator
+
+@implements(np.expand_dims)
+def expand_dims_MultiArray(multiarray,axis):
+    return MultiArray([np.expand_dims(a,axis) for a in multiarray.arrays]) #This is gonna spit out a list and I'm not sure if I'm okay with that?
+
+@implements(np.concatenate)
+def concatenate_MultiArray(multiarrays,axis):
+    
+    n_arrays = len(multiarrays[0].arrays)
+    for ma in multiarrays[1:]:
+        if not (len(ma.arrays) == n_arrays): # I don't know what trying to concatenate MultiArrays with different numbers of arrays would even mean
+            raise NotImplementedError
+      
+    # There's the potential for problematic different shapes coming in here.  
+    # Probably warrants some defensive programming, but I'm not sure what to check for while still being generic
+    
+    # I don't like using append and lists here, but I can't work out how to do it better
+    new_arrays = []
+    for i in range(multiarrays[0].ndim):
+        new_arrays.append(np.concatenate([ma.arrays[i] for ma in multiarrays],axis))
+    
+    out = MultiArray(new_arrays)
+    return out
+
+@implements(np.transpose)
+def transpose_MultiArray(multiarray,axes):
+    return MultiArray([np.transpose(a,axes) for a in multiarray.arrays]) #This is gonna spit out a list and I'm not sure if I'm okay with that?
+
 
 def _prepare_for_flox(group_idx, array):
     """
@@ -206,7 +286,6 @@ def _nan_grouped_op(group_idx, array, func, fillna, *args, **kwargs):
 nanmedian = partial(partial(_np_grouped_op, q=0.5), op=partial(quantile_, skipna=True))
 # TODO: all, any
 
-
 def sum_of_squares(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=None):
     return sum(
         group_idx,
@@ -250,6 +329,41 @@ def nanmean(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=None
         out /= nanlen(group_idx, array, size=size, axis=axis, fill_value=0)
     return out
 
+def var_chunk(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=None):
+    # Calculate length and sum - important for the adjustment terms to sum squared deviations
+    array_lens = nanlen(
+        group_idx,
+        array,
+        axis=axis,
+        size=size,
+        fill_value=fill_value,
+        dtype=dtype,
+    )
+    
+    array_sums = sum(
+        group_idx,
+        array,
+        axis=axis,
+        size=size,
+        fill_value=fill_value,
+        dtype=dtype,
+    )
+    
+    # Calculate sum squared deviations - the main part of variance sum
+    array_means = array_sums/array_lens # Does this risk being run eagerly because it's not wrapped in anything?
+    
+    sum_squared_deviations = sum(
+        group_idx,
+        (array-array_means[..., group_idx])**2,
+        axis=axis,
+        size=size,
+        fill_value=fill_value,
+        dtype=dtype,
+    ) 
+
+    return MultiArray((sum_squared_deviations,array_sums,array_lens))
+
+
 
 def ffill(group_idx, array, *, axis, **kwargs):
     group_idx, array, perm = _prepare_for_flox(group_idx, array)
diff --git a/flox/aggregations.py b/flox/aggregations.py
index 6182d6bd..56aec6a5 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -342,14 +342,57 @@ def _mean_finalize(sum_, count):
     final_dtype=np.floating,
 )
 
-
+def _var_combine(array, axis, keepdims=True):
+    
+    def clip_last(array):
+        '''Return array except the last element along axis
+        Purely included to tidy up the adj_terms line
+        '''
+        not_last = [slice(None,None) for i in range(array.ndim)]
+        not_last[axis[0]] = slice(None,-1)
+        return array[*not_last]
+    def clip_first(array):
+        '''Return array except the first element along axis
+        Purely included to tidy up the adj_terms line
+        '''        
+        not_first = [slice(None,None) for i in range(array.ndim)]
+        not_first[axis[0]] = slice(1,None)        
+        return array[*not_first]    
+    
+    assert len(axis)==1, "Assuming that the combine function is only in one direction at once"
+    
+    # Does this double our memory footprint or are they just views?
+    # If there's a huge memory impact, probably better to copy paste array.arrays[1]
+    # in and accept the hit to readability
+    sum_deviations = array.arrays[0]
+    sum_X = array.arrays[1]
+    sum_len = array.arrays[2]    
+    
+    # Calculate parts needed for cascading combination
+    cumsum_X = np.cumsum(sum_X,axis=axis[0]) #Don't need to be able to merge the last element
+    cumsum_len = np.cumsum(sum_len,axis=axis[0])
+
+
+    # Adjustment terms to tweak the sum of squared deviations because not every chunk has the same mean
+    adj_terms = ((clip_last(cumsum_len)*clip_first(sum_X)-clip_first(sum_len)*clip_last(cumsum_X))**2/
+                 (clip_last(cumsum_len)*clip_first(sum_len)*(clip_last(cumsum_len)+clip_first(sum_len))))
+    
+
+
+    return aggregate_flox.MultiArray((np.sum(sum_deviations,axis=axis,keepdims=keepdims)+np.sum(adj_terms,axis=axis,keepdims=keepdims), # sum of squared deviations
+                                      np.sum(sum_X,axis=axis,keepdims=keepdims),           # sum of array items
+                                      np.sum(sum_len,axis=axis,keepdims=keepdims),           # sum of array lengths
+                                        ))# I'm not even pretending calling this class from there is a good idea, I think it wants to be somewhere else though
+    
 # TODO: fix this for complex numbers
-def _var_finalize(sumsq, sum_, count, ddof=0):
-    with np.errstate(invalid="ignore", divide="ignore"):
-        result = (sumsq - (sum_**2 / count)) / (count - ddof)
-    result[count <= ddof] = np.nan
-    return result
+#def _var_finalize(sumsq, sum_, count, ddof=0):
+    #with np.errstate(invalid="ignore", divide="ignore"):
+        #result = (sumsq - (sum_**2 / count)) / (count - ddof)
+    #result[count <= ddof] = np.nan
+    #return result
 
+def _var_finalize(multiarray,ddof=0):
+    return multiarray.arrays[0]/(multiarray.arrays[2]-ddof) # Is this how ddof works again???
 
 def _std_finalize(sumsq, sum_, count, ddof=0):
     return np.sqrt(_var_finalize(sumsq, sum_, count, ddof))
@@ -366,14 +409,24 @@ def _std_finalize(sumsq, sum_, count, ddof=0):
     dtypes=(None, None, np.intp),
     final_dtype=np.floating,
 )
+#nanvar = Aggregation(
+    #"nanvar",
+    #chunk=("nansum_of_squares", "nansum", "nanlen"),
+    #combine=("sum", "sum", "sum"),
+    #finalize=_var_finalize,
+    #fill_value=0,
+    #final_fill_value=np.nan,
+    #dtypes=(None, None, np.intp),
+    #final_dtype=np.floating,
+#)
 nanvar = Aggregation(
     "nanvar",
-    chunk=("nansum_of_squares", "nansum", "nanlen"),
-    combine=("sum", "sum", "sum"),
+    chunk=("var_chunk"),
+    combine=(_var_combine,),
     finalize=_var_finalize,
     fill_value=0,
     final_fill_value=np.nan,
-    dtypes=(None, None, np.intp),
+    dtypes=(None, ),
     final_dtype=np.floating,
 )
 std = Aggregation(

From 1fbf5f85a192c2cfd322f7095ed724b6b6112689 Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Fri, 18 Jul 2025 06:26:35 +0000
Subject: [PATCH 02/54] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 flox/__init__.py       |  2 +
 flox/_version.py       |  2 +-
 flox/aggregate_flox.py | 96 ++++++++++++++++++++++++------------------
 flox/aggregations.py   | 94 ++++++++++++++++++++++-------------------
 4 files changed, 109 insertions(+), 85 deletions(-)

diff --git a/flox/__init__.py b/flox/__init__.py
index 2ed80afc..898c10e2 100644
--- a/flox/__init__.py
+++ b/flox/__init__.py
@@ -13,6 +13,7 @@
     ReindexArrayType,
 )  # noqa
 
+
 def _get_version():
     __version__ = "999"
     try:
@@ -21,4 +22,5 @@ def _get_version():
         pass
     return __version__
 
+
 __version__ = _get_version()
diff --git a/flox/_version.py b/flox/_version.py
index 5b33c8a4..a76cf84b 100644
--- a/flox/_version.py
+++ b/flox/_version.py
@@ -1 +1 @@
-__version__ = "0.1.dev657+g619a390.d20250606"
\ No newline at end of file
+__version__ = "0.1.dev657+g619a390.d20250606"
diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index ea1aa2c1..d5f0084c 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -7,38 +7,40 @@
 
 MULTIARRAY_HANDLED_FUNCTIONS = {}
 
+
 class MultiArray:
     arrays: tuple[np.ndarray, ...]
 
     def __init__(self, arrays):
-        self.arrays = arrays # something else needed here to be more careful about types (not sure what)
+        self.arrays = arrays  # something else needed here to be more careful about types (not sure what)
         # Do we want to co-erce arrays into a tuple and make sure it's immutable? Do we want it to be immutable?
-        assert np.all([arrays[0].shape == a.shape for a in arrays]), 'Expect all arrays to have the same shape'
-        
-    def astype(self,dt,**kwargs):
-        new_arrays = [] # I really don't like doing this as a list
-        for array in self.arrays: # Do we care about trying to avoid for loops here? three separate lines would be faster, but harder to read
-            new_arrays.append(array.astype(dt,**kwargs))
+        assert np.all([arrays[0].shape == a.shape for a in arrays]), (
+            "Expect all arrays to have the same shape"
+        )
+
+    def astype(self, dt, **kwargs):
+        new_arrays = []  # I really don't like doing this as a list
+        for array in self.arrays:  # Do we care about trying to avoid for loops here? three separate lines would be faster, but harder to read
+            new_arrays.append(array.astype(dt, **kwargs))
         return MultiArray(new_arrays)
-    
-    def reshape(self,shape,**kwargs):
-        return MultiArray([array.reshape(shape,**kwargs) for array in self.arrays])
-    
-    def squeeze(self,axis=None):
-        return MultiArray([array.squeeze(axis) for array in self.arrays])    
-    
+
+    def reshape(self, shape, **kwargs):
+        return MultiArray([array.reshape(shape, **kwargs) for array in self.arrays])
+
+    def squeeze(self, axis=None):
+        return MultiArray([array.squeeze(axis) for array in self.arrays])
+
     def __array_function__(self, func, types, args, kwargs):
         if func not in MULTIARRAY_HANDLED_FUNCTIONS:
             return NotImplemented
         # Note: this allows subclasses that don't override
         # __array_function__ to handle MyArray objects
-        #if not all(issubclass(t, MyArray) for t in types): # I can't see this being relevant at all for this code, but maybe it's safer to leave it in?
-            #return NotImplemented
-        return MULTIARRAY_HANDLED_FUNCTIONS[func](*args, **kwargs)    
+        # if not all(issubclass(t, MyArray) for t in types): # I can't see this being relevant at all for this code, but maybe it's safer to leave it in?
+        # return NotImplemented
+        return MULTIARRAY_HANDLED_FUNCTIONS[func](*args, **kwargs)
 
-        
-   # Shape is needed, seems likely that the other two might be
-   # Making some strong assumptions here that all the arrays are the same shape, and I don't really like this
+    # Shape is needed, seems likely that the other two might be
+    # Making some strong assumptions here that all the arrays are the same shape, and I don't really like this
     @property
     def dtype(self) -> np.dtype:
         return self.arrays[0].dtype
@@ -51,39 +53,50 @@ def shape(self) -> tuple[int, ...]:
     def ndim(self) -> int:
         return self.arrays[0].ndim
 
+
 def implements(numpy_function):
     """Register an __array_function__ implementation for MyArray objects."""
+
     def decorator(func):
         MULTIARRAY_HANDLED_FUNCTIONS[numpy_function] = func
         return func
+
     return decorator
 
+
 @implements(np.expand_dims)
-def expand_dims_MultiArray(multiarray,axis):
-    return MultiArray([np.expand_dims(a,axis) for a in multiarray.arrays]) #This is gonna spit out a list and I'm not sure if I'm okay with that?
+def expand_dims_MultiArray(multiarray, axis):
+    return MultiArray(
+        [np.expand_dims(a, axis) for a in multiarray.arrays]
+    )  # This is gonna spit out a list and I'm not sure if I'm okay with that?
+
 
 @implements(np.concatenate)
-def concatenate_MultiArray(multiarrays,axis):
-    
+def concatenate_MultiArray(multiarrays, axis):
     n_arrays = len(multiarrays[0].arrays)
     for ma in multiarrays[1:]:
-        if not (len(ma.arrays) == n_arrays): # I don't know what trying to concatenate MultiArrays with different numbers of arrays would even mean
+        if not (
+            len(ma.arrays) == n_arrays
+        ):  # I don't know what trying to concatenate MultiArrays with different numbers of arrays would even mean
             raise NotImplementedError
-      
-    # There's the potential for problematic different shapes coming in here.  
+
+    # There's the potential for problematic different shapes coming in here.
     # Probably warrants some defensive programming, but I'm not sure what to check for while still being generic
-    
+
     # I don't like using append and lists here, but I can't work out how to do it better
     new_arrays = []
     for i in range(multiarrays[0].ndim):
-        new_arrays.append(np.concatenate([ma.arrays[i] for ma in multiarrays],axis))
-    
+        new_arrays.append(np.concatenate([ma.arrays[i] for ma in multiarrays], axis))
+
     out = MultiArray(new_arrays)
     return out
 
+
 @implements(np.transpose)
-def transpose_MultiArray(multiarray,axes):
-    return MultiArray([np.transpose(a,axes) for a in multiarray.arrays]) #This is gonna spit out a list and I'm not sure if I'm okay with that?
+def transpose_MultiArray(multiarray, axes):
+    return MultiArray(
+        [np.transpose(a, axes) for a in multiarray.arrays]
+    )  # This is gonna spit out a list and I'm not sure if I'm okay with that?
 
 
 def _prepare_for_flox(group_idx, array):
@@ -286,6 +299,7 @@ def _nan_grouped_op(group_idx, array, func, fillna, *args, **kwargs):
 nanmedian = partial(partial(_np_grouped_op, q=0.5), op=partial(quantile_, skipna=True))
 # TODO: all, any
 
+
 def sum_of_squares(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=None):
     return sum(
         group_idx,
@@ -329,6 +343,7 @@ def nanmean(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=None
         out /= nanlen(group_idx, array, size=size, axis=axis, fill_value=0)
     return out
 
+
 def var_chunk(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=None):
     # Calculate length and sum - important for the adjustment terms to sum squared deviations
     array_lens = nanlen(
@@ -339,7 +354,7 @@ def var_chunk(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=No
         fill_value=fill_value,
         dtype=dtype,
     )
-    
+
     array_sums = sum(
         group_idx,
         array,
@@ -348,21 +363,22 @@ def var_chunk(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=No
         fill_value=fill_value,
         dtype=dtype,
     )
-    
+
     # Calculate sum squared deviations - the main part of variance sum
-    array_means = array_sums/array_lens # Does this risk being run eagerly because it's not wrapped in anything?
-    
+    array_means = (
+        array_sums / array_lens
+    )  # Does this risk being run eagerly because it's not wrapped in anything?
+
     sum_squared_deviations = sum(
         group_idx,
-        (array-array_means[..., group_idx])**2,
+        (array - array_means[..., group_idx]) ** 2,
         axis=axis,
         size=size,
         fill_value=fill_value,
         dtype=dtype,
-    ) 
-
-    return MultiArray((sum_squared_deviations,array_sums,array_lens))
+    )
 
+    return MultiArray((sum_squared_deviations, array_sums, array_lens))
 
 
 def ffill(group_idx, array, *, axis, **kwargs):
diff --git a/flox/aggregations.py b/flox/aggregations.py
index 56aec6a5..f95428d6 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -342,57 +342,63 @@ def _mean_finalize(sum_, count):
     final_dtype=np.floating,
 )
 
+
 def _var_combine(array, axis, keepdims=True):
-    
     def clip_last(array):
-        '''Return array except the last element along axis
+        """Return array except the last element along axis
         Purely included to tidy up the adj_terms line
-        '''
-        not_last = [slice(None,None) for i in range(array.ndim)]
-        not_last[axis[0]] = slice(None,-1)
+        """
+        not_last = [slice(None, None) for i in range(array.ndim)]
+        not_last[axis[0]] = slice(None, -1)
         return array[*not_last]
+
     def clip_first(array):
-        '''Return array except the first element along axis
+        """Return array except the first element along axis
         Purely included to tidy up the adj_terms line
-        '''        
-        not_first = [slice(None,None) for i in range(array.ndim)]
-        not_first[axis[0]] = slice(1,None)        
-        return array[*not_first]    
-    
-    assert len(axis)==1, "Assuming that the combine function is only in one direction at once"
-    
+        """
+        not_first = [slice(None, None) for i in range(array.ndim)]
+        not_first[axis[0]] = slice(1, None)
+        return array[*not_first]
+
+    assert len(axis) == 1, "Assuming that the combine function is only in one direction at once"
+
     # Does this double our memory footprint or are they just views?
     # If there's a huge memory impact, probably better to copy paste array.arrays[1]
     # in and accept the hit to readability
     sum_deviations = array.arrays[0]
     sum_X = array.arrays[1]
-    sum_len = array.arrays[2]    
-    
-    # Calculate parts needed for cascading combination
-    cumsum_X = np.cumsum(sum_X,axis=axis[0]) #Don't need to be able to merge the last element
-    cumsum_len = np.cumsum(sum_len,axis=axis[0])
+    sum_len = array.arrays[2]
 
+    # Calculate parts needed for cascading combination
+    cumsum_X = np.cumsum(sum_X, axis=axis[0])  # Don't need to be able to merge the last element
+    cumsum_len = np.cumsum(sum_len, axis=axis[0])
 
     # Adjustment terms to tweak the sum of squared deviations because not every chunk has the same mean
-    adj_terms = ((clip_last(cumsum_len)*clip_first(sum_X)-clip_first(sum_len)*clip_last(cumsum_X))**2/
-                 (clip_last(cumsum_len)*clip_first(sum_len)*(clip_last(cumsum_len)+clip_first(sum_len))))
-    
+    adj_terms = (
+        clip_last(cumsum_len) * clip_first(sum_X) - clip_first(sum_len) * clip_last(cumsum_X)
+    ) ** 2 / (clip_last(cumsum_len) * clip_first(sum_len) * (clip_last(cumsum_len) + clip_first(sum_len)))
+
+    return aggregate_flox.MultiArray(
+        (
+            np.sum(sum_deviations, axis=axis, keepdims=keepdims)
+            + np.sum(adj_terms, axis=axis, keepdims=keepdims),  # sum of squared deviations
+            np.sum(sum_X, axis=axis, keepdims=keepdims),  # sum of array items
+            np.sum(sum_len, axis=axis, keepdims=keepdims),  # sum of array lengths
+        )
+    )  # I'm not even pretending calling this class from there is a good idea, I think it wants to be somewhere else though
 
 
-    return aggregate_flox.MultiArray((np.sum(sum_deviations,axis=axis,keepdims=keepdims)+np.sum(adj_terms,axis=axis,keepdims=keepdims), # sum of squared deviations
-                                      np.sum(sum_X,axis=axis,keepdims=keepdims),           # sum of array items
-                                      np.sum(sum_len,axis=axis,keepdims=keepdims),           # sum of array lengths
-                                        ))# I'm not even pretending calling this class from there is a good idea, I think it wants to be somewhere else though
-    
 # TODO: fix this for complex numbers
-#def _var_finalize(sumsq, sum_, count, ddof=0):
-    #with np.errstate(invalid="ignore", divide="ignore"):
-        #result = (sumsq - (sum_**2 / count)) / (count - ddof)
-    #result[count <= ddof] = np.nan
-    #return result
+# def _var_finalize(sumsq, sum_, count, ddof=0):
+# with np.errstate(invalid="ignore", divide="ignore"):
+# result = (sumsq - (sum_**2 / count)) / (count - ddof)
+# result[count <= ddof] = np.nan
+# return result
+
+
+def _var_finalize(multiarray, ddof=0):
+    return multiarray.arrays[0] / (multiarray.arrays[2] - ddof)  # Is this how ddof works again???
 
-def _var_finalize(multiarray,ddof=0):
-    return multiarray.arrays[0]/(multiarray.arrays[2]-ddof) # Is this how ddof works again???
 
 def _std_finalize(sumsq, sum_, count, ddof=0):
     return np.sqrt(_var_finalize(sumsq, sum_, count, ddof))
@@ -409,16 +415,16 @@ def _std_finalize(sumsq, sum_, count, ddof=0):
     dtypes=(None, None, np.intp),
     final_dtype=np.floating,
 )
-#nanvar = Aggregation(
-    #"nanvar",
-    #chunk=("nansum_of_squares", "nansum", "nanlen"),
-    #combine=("sum", "sum", "sum"),
-    #finalize=_var_finalize,
-    #fill_value=0,
-    #final_fill_value=np.nan,
-    #dtypes=(None, None, np.intp),
-    #final_dtype=np.floating,
-#)
+# nanvar = Aggregation(
+# "nanvar",
+# chunk=("nansum_of_squares", "nansum", "nanlen"),
+# combine=("sum", "sum", "sum"),
+# finalize=_var_finalize,
+# fill_value=0,
+# final_fill_value=np.nan,
+# dtypes=(None, None, np.intp),
+# final_dtype=np.floating,
+# )
 nanvar = Aggregation(
     "nanvar",
     chunk=("var_chunk"),
@@ -426,7 +432,7 @@ def _std_finalize(sumsq, sum_, count, ddof=0):
     finalize=_var_finalize,
     fill_value=0,
     final_fill_value=np.nan,
-    dtypes=(None, ),
+    dtypes=(None,),
     final_dtype=np.floating,
 )
 std = Aggregation(

From 322f5115509c2127316cc051fdf55c1b804b96cc Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Fri, 18 Jul 2025 09:47:42 -0600
Subject: [PATCH 03/54] [revert] only nanvar test

---
 tests/test_core.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_core.py b/tests/test_core.py
index 88169c0f..7545480b 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -235,7 +235,7 @@ def gen_array_by(size, func):
 @pytest.mark.parametrize("size", [(1, 12), (12,), (12, 9)])
 @pytest.mark.parametrize("nby", [1, 2, 3])
 @pytest.mark.parametrize("add_nan_by", [True, False])
-@pytest.mark.parametrize("func", ALL_FUNCS)
+@pytest.mark.parametrize("func", ["nanvar"])
 def test_groupby_reduce_all(to_sparse, nby, size, chunks, func, add_nan_by, engine):
     if ("arg" in func and engine in ["flox", "numbagg"]) or (func in BLOCKWISE_FUNCS and chunks != -1):
         pytest.skip()

From adab8e68b2823d8cba82ff279332fc1e4bf5e858 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Fri, 18 Jul 2025 09:49:10 -0600
Subject: [PATCH 04/54] Some mods

---
 flox/aggregate_flox.py | 41 ++++--------------------------------
 flox/aggregations.py   | 48 +++++++++++++++++++++++++++++++++++++++++-
 flox/core.py           |  8 ++++++-
 3 files changed, 58 insertions(+), 39 deletions(-)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index d5f0084c..41309fcf 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -1,4 +1,5 @@
 from functools import partial
+from typing import Self
 
 import numpy as np
 
@@ -53,6 +54,9 @@ def shape(self) -> tuple[int, ...]:
     def ndim(self) -> int:
         return self.arrays[0].ndim
 
+    def __getitem__(self, key) -> Self:
+        return type(self)([array[key] for array in self.arrays])
+
 
 def implements(numpy_function):
     """Register an __array_function__ implementation for MyArray objects."""
@@ -344,43 +348,6 @@ def nanmean(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=None
     return out
 
 
-def var_chunk(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=None):
-    # Calculate length and sum - important for the adjustment terms to sum squared deviations
-    array_lens = nanlen(
-        group_idx,
-        array,
-        axis=axis,
-        size=size,
-        fill_value=fill_value,
-        dtype=dtype,
-    )
-
-    array_sums = sum(
-        group_idx,
-        array,
-        axis=axis,
-        size=size,
-        fill_value=fill_value,
-        dtype=dtype,
-    )
-
-    # Calculate sum squared deviations - the main part of variance sum
-    array_means = (
-        array_sums / array_lens
-    )  # Does this risk being run eagerly because it's not wrapped in anything?
-
-    sum_squared_deviations = sum(
-        group_idx,
-        (array - array_means[..., group_idx]) ** 2,
-        axis=axis,
-        size=size,
-        fill_value=fill_value,
-        dtype=dtype,
-    )
-
-    return MultiArray((sum_squared_deviations, array_sums, array_lens))
-
-
 def ffill(group_idx, array, *, axis, **kwargs):
     group_idx, array, perm = _prepare_for_flox(group_idx, array)
     shape = array.shape
diff --git a/flox/aggregations.py b/flox/aggregations.py
index f95428d6..0961d13a 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -343,6 +343,51 @@ def _mean_finalize(sum_, count):
 )
 
 
+def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=None, dtype=None):
+    from .aggregate_flox import MultiArray
+
+    # Calculate length and sum - important for the adjustment terms to sum squared deviations
+    array_lens = generic_aggregate(
+        group_idx,
+        array,
+        func="nanlen",
+        engine=engine,
+        axis=axis,
+        size=size,
+        fill_value=fill_value,
+        dtype=dtype,
+    )
+
+    array_sums = generic_aggregate(
+        group_idx,
+        array,
+        func="nansum",
+        engine=engine,
+        axis=axis,
+        size=size,
+        fill_value=fill_value,
+        dtype=dtype,
+    )
+
+    # Calculate sum squared deviations - the main part of variance sum
+    array_means = (
+        array_sums / array_lens
+    )  # Does this risk being run eagerly because it's not wrapped in anything?
+
+    sum_squared_deviations = generic_aggregate(
+        group_idx,
+        (array - array_means[..., group_idx]) ** 2,
+        func="nansum",
+        engine=engine,
+        axis=axis,
+        size=size,
+        fill_value=fill_value,
+        dtype=dtype,
+    )
+
+    return MultiArray((sum_squared_deviations, array_sums, array_lens))
+
+
 def _var_combine(array, axis, keepdims=True):
     def clip_last(array):
         """Return array except the last element along axis
@@ -427,7 +472,8 @@ def _std_finalize(sumsq, sum_, count, ddof=0):
 # )
 nanvar = Aggregation(
     "nanvar",
-    chunk=("var_chunk"),
+    chunk=var_chunk,
+    numpy="nanvar",
     combine=(_var_combine,),
     finalize=_var_finalize,
     fill_value=0,
diff --git a/flox/core.py b/flox/core.py
index d8600b37..f8d724a1 100644
--- a/flox/core.py
+++ b/flox/core.py
@@ -46,6 +46,7 @@
     _initialize_aggregation,
     generic_aggregate,
     quantile_new_dims_func,
+    var_chunk,
 )
 from .cache import memoize
 from .lib import ArrayLayer, dask_array_type, sparse_array_type
@@ -1251,7 +1252,8 @@ def chunk_reduce(
     # optimize that out.
     previous_reduction: T_Func = ""
     for reduction, fv, kw, dt in zip(funcs, fill_values, kwargss, dtypes):
-        if empty:
+        # UGLY! but this is because the `var` breaks our design assumptions
+        if empty and reduction is not var_chunk:
             result = np.full(shape=final_array_shape, fill_value=fv, like=array)
         elif is_nanlen(reduction) and is_nanlen(previous_reduction):
             result = results["intermediates"][-1]
@@ -1260,6 +1262,10 @@ def chunk_reduce(
             kw_func = dict(size=size, dtype=dt, fill_value=fv)
             kw_func.update(kw)
 
+            # UGLY! but this is because the `var` breaks our design assumptions
+            if reduction is var_chunk:
+                kw_func.update(engine=engine)
+
             if callable(reduction):
                 # passing a custom reduction for npg to apply per-group is really slow!
                 # So this `reduction` has to do the groupby-aggregation

From 93cd9b309277a9512f6d63e251e27c5b5ef00dd3 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Mon, 21 Jul 2025 12:11:31 +1000
Subject: [PATCH 05/54] Update flox/aggregations.py to neater tuple unpacking

Co-authored-by: Deepak Cherian <dcherian@users.noreply.github.com>
---
 flox/aggregations.py | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 0961d13a..f989571f 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -410,9 +410,7 @@ def clip_first(array):
     # Does this double our memory footprint or are they just views?
     # If there's a huge memory impact, probably better to copy paste array.arrays[1]
     # in and accept the hit to readability
-    sum_deviations = array.arrays[0]
-    sum_X = array.arrays[1]
-    sum_len = array.arrays[2]
+   sum_deviations, sum_X, sum_len = array.arrays
 
     # Calculate parts needed for cascading combination
     cumsum_X = np.cumsum(sum_X, axis=axis[0])  # Don't need to be able to merge the last element

From 2be4f744d8eb97f7ba4ac27fd2ec4ba5bcacf0bc Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Mon, 21 Jul 2025 12:19:10 +1000
Subject: [PATCH 06/54] Change np.all to all in  flox/aggregate_flox.py

Co-authored-by: Deepak Cherian <dcherian@users.noreply.github.com>
---
 flox/aggregate_flox.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index 41309fcf..ce128d28 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -15,7 +15,7 @@ class MultiArray:
     def __init__(self, arrays):
         self.arrays = arrays  # something else needed here to be more careful about types (not sure what)
         # Do we want to co-erce arrays into a tuple and make sure it's immutable? Do we want it to be immutable?
-        assert np.all([arrays[0].shape == a.shape for a in arrays]), (
+        assert all(arrays[0].shape == a.shape for a in arrays), (
             "Expect all arrays to have the same shape"
         )
 

From edb655dd1f9bd661e9b16b1146cb1fd380cd7380 Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Mon, 21 Jul 2025 02:19:17 +0000
Subject: [PATCH 07/54] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 flox/aggregate_flox.py | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index ce128d28..21cbd111 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -15,9 +15,7 @@ class MultiArray:
     def __init__(self, arrays):
         self.arrays = arrays  # something else needed here to be more careful about types (not sure what)
         # Do we want to co-erce arrays into a tuple and make sure it's immutable? Do we want it to be immutable?
-        assert all(arrays[0].shape == a.shape for a in arrays), (
-            "Expect all arrays to have the same shape"
-        )
+        assert all(arrays[0].shape == a.shape for a in arrays), "Expect all arrays to have the same shape"
 
     def astype(self, dt, **kwargs):
         new_arrays = []  # I really don't like doing this as a list

From dd2e4b6a30784fca103d593c4b96c6056d72f6d9 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Mon, 21 Jul 2025 12:24:19 +1000
Subject: [PATCH 08/54] delete some resolved comments

---
 flox/aggregate_flox.py | 2 +-
 flox/aggregations.py   | 3 ---
 2 files changed, 1 insertion(+), 4 deletions(-)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index ea1aa2c1..fa5a9501 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -350,7 +350,7 @@ def var_chunk(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=No
     )
     
     # Calculate sum squared deviations - the main part of variance sum
-    array_means = array_sums/array_lens # Does this risk being run eagerly because it's not wrapped in anything?
+    array_means = array_sums/array_lens
     
     sum_squared_deviations = sum(
         group_idx,
diff --git a/flox/aggregations.py b/flox/aggregations.py
index 56aec6a5..10cb8add 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -361,9 +361,6 @@ def clip_first(array):
     
     assert len(axis)==1, "Assuming that the combine function is only in one direction at once"
     
-    # Does this double our memory footprint or are they just views?
-    # If there's a huge memory impact, probably better to copy paste array.arrays[1]
-    # in and accept the hit to readability
     sum_deviations = array.arrays[0]
     sum_X = array.arrays[1]
     sum_len = array.arrays[2]    

From 19688709b3fa2ec76b33ed73744a91f14ee1b72c Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Mon, 21 Jul 2025 02:39:21 +0000
Subject: [PATCH 09/54] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 flox/aggregate_flox.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index b818bd75..21cbd111 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -345,6 +345,7 @@ def nanmean(group_idx, array, *, axis=-1, size=None, fill_value=None, dtype=None
         out /= nanlen(group_idx, array, size=size, axis=axis, fill_value=0)
     return out
 
+
 def ffill(group_idx, array, *, axis, **kwargs):
     group_idx, array, perm = _prepare_for_flox(group_idx, array)
     shape = array.shape

From 12bcb0f56296a2dac7835ed269d7dca68d36e081 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Mon, 21 Jul 2025 14:40:52 +1000
Subject: [PATCH 10/54] Remove more unnecessary comments

---
 flox/aggregations.py | 7 ++-----
 1 file changed, 2 insertions(+), 5 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index a9674757..e9bfb166 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -372,7 +372,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
     # Calculate sum squared deviations - the main part of variance sum
     array_means = (
         array_sums / array_lens
-    )  # Does this risk being run eagerly because it's not wrapped in anything?
+    )
 
     sum_squared_deviations = generic_aggregate(
         group_idx,
@@ -407,9 +407,6 @@ def clip_first(array):
 
     assert len(axis) == 1, "Assuming that the combine function is only in one direction at once"
 
-    # Does this double our memory footprint or are they just views?
-    # If there's a huge memory impact, probably better to copy paste array.arrays[1]
-    # in and accept the hit to readability
     sum_deviations, sum_X, sum_len = array.arrays
 
     # Calculate parts needed for cascading combination
@@ -440,7 +437,7 @@ def clip_first(array):
 
 
 def _var_finalize(multiarray, ddof=0):
-    return multiarray.arrays[0] / (multiarray.arrays[2] - ddof)  # Is this how ddof works again???
+    return multiarray.arrays[0] / (multiarray.arrays[2] - ddof)
 
 
 def _std_finalize(sumsq, sum_, count, ddof=0):

From b1f7b5d71b934669e44dd78ffa9120b7abaf87b3 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Mon, 21 Jul 2025 14:45:29 +1000
Subject: [PATCH 11/54] Remove _version.py

---
 flox/_version.py | 1 -
 1 file changed, 1 deletion(-)
 delete mode 100644 flox/_version.py

diff --git a/flox/_version.py b/flox/_version.py
deleted file mode 100644
index a76cf84b..00000000
--- a/flox/_version.py
+++ /dev/null
@@ -1 +0,0 @@
-__version__ = "0.1.dev657+g619a390.d20250606"

From cd9a8b83db27a1d9ae894a4ef37e98341115cb6a Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Mon, 21 Jul 2025 04:46:38 +0000
Subject: [PATCH 12/54] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 flox/aggregations.py | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 1f4c59ab..975c3258 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -370,9 +370,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
     )
 
     # Calculate sum squared deviations - the main part of variance sum
-    array_means = (
-        array_sums / array_lens
-    )
+    array_means = array_sums / array_lens
 
     sum_squared_deviations = generic_aggregate(
         group_idx,

From 27448e451c89aad1f307ae39f825060508822a38 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Thu, 31 Jul 2025 17:42:11 +1000
Subject: [PATCH 13/54] Add preliminary test for std/var precision

---
 tests/test_core.py | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)

diff --git a/tests/test_core.py b/tests/test_core.py
index 863e552d..3926502e 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -2240,3 +2240,25 @@ def test_sparse_nan_fill_value_reductions(chunks, fill_value, shape, func):
         expected = np.expand_dims(npfunc(numpy_array, axis=-1), axis=-1)
         actual, *_ = groupby_reduce(array, by, func=func, axis=-1)
     assert_equal(actual, expected)
+
+
+@pytest.mark.parametrize("func", ("nanvar","var")) # Expect to expand this to other functions once written. Putting var in to begin with bc I know it will fail
+@pytest.mark.parametrize("engine",("flox",)) # Expect to expand this to other engines once written
+@pytest.mark.parametrize("offset",(0,10e2,10e4,10e6,10e8,10e10,10e12)) # Should fail at 10e8 for old algorithm, and survive 10e12 for current
+def test_std_var_precision(func,engine,offset):
+    # Generate a dataset with small variance and big mean
+    # Check that func with engine gives you the same answer as numpy
+    
+    l =1000
+    array = np.linspace(-1,1,l) # has zero mean
+    labels = np.arange(l)%2 # Ideally we'd parametrize this too. 
+    
+    # These two need to be the same function, but with the offset added and not added
+    no_offset, _ = groupby_reduce(array, labels, engine=engine, func=func)
+    with_offset, _ = groupby_reduce(array+offset, labels, engine=engine, func=func)
+    
+    tol = {"rtol": 1e-8, "atol": 1e-10} # Not sure how stringent to be here
+    
+    # Failure threshold in my external tests is dependent on dask chunksize, maybe needs exploring better?
+    
+    assert_equal(no_offset, with_offset, tol)
\ No newline at end of file

From a81b1a3847f54ac8f4dca25aee35c86788c18766 Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Thu, 31 Jul 2025 07:47:15 +0000
Subject: [PATCH 14/54] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 tests/test_core.py | 34 +++++++++++++++++++---------------
 1 file changed, 19 insertions(+), 15 deletions(-)

diff --git a/tests/test_core.py b/tests/test_core.py
index 3926502e..4f1e2856 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -2242,23 +2242,27 @@ def test_sparse_nan_fill_value_reductions(chunks, fill_value, shape, func):
     assert_equal(actual, expected)
 
 
-@pytest.mark.parametrize("func", ("nanvar","var")) # Expect to expand this to other functions once written. Putting var in to begin with bc I know it will fail
-@pytest.mark.parametrize("engine",("flox",)) # Expect to expand this to other engines once written
-@pytest.mark.parametrize("offset",(0,10e2,10e4,10e6,10e8,10e10,10e12)) # Should fail at 10e8 for old algorithm, and survive 10e12 for current
-def test_std_var_precision(func,engine,offset):
+@pytest.mark.parametrize(
+    "func", ("nanvar", "var")
+)  # Expect to expand this to other functions once written. Putting var in to begin with bc I know it will fail
+@pytest.mark.parametrize("engine", ("flox",))  # Expect to expand this to other engines once written
+@pytest.mark.parametrize(
+    "offset", (0, 10e2, 10e4, 10e6, 10e8, 10e10, 10e12)
+)  # Should fail at 10e8 for old algorithm, and survive 10e12 for current
+def test_std_var_precision(func, engine, offset):
     # Generate a dataset with small variance and big mean
     # Check that func with engine gives you the same answer as numpy
-    
-    l =1000
-    array = np.linspace(-1,1,l) # has zero mean
-    labels = np.arange(l)%2 # Ideally we'd parametrize this too. 
-    
+
+    l = 1000
+    array = np.linspace(-1, 1, l)  # has zero mean
+    labels = np.arange(l) % 2  # Ideally we'd parametrize this too.
+
     # These two need to be the same function, but with the offset added and not added
     no_offset, _ = groupby_reduce(array, labels, engine=engine, func=func)
-    with_offset, _ = groupby_reduce(array+offset, labels, engine=engine, func=func)
-    
-    tol = {"rtol": 1e-8, "atol": 1e-10} # Not sure how stringent to be here
-    
+    with_offset, _ = groupby_reduce(array + offset, labels, engine=engine, func=func)
+
+    tol = {"rtol": 1e-8, "atol": 1e-10}  # Not sure how stringent to be here
+
     # Failure threshold in my external tests is dependent on dask chunksize, maybe needs exploring better?
-    
-    assert_equal(no_offset, with_offset, tol)
\ No newline at end of file
+
+    assert_equal(no_offset, with_offset, tol)

From 004fddcc88e169a369e4505e7e9cdcac3f80dd39 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Thu, 31 Jul 2025 17:56:31 +1000
Subject: [PATCH 15/54] Correct comment

---
 tests/test_core.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_core.py b/tests/test_core.py
index 3926502e..623c6ae2 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -2242,7 +2242,7 @@ def test_sparse_nan_fill_value_reductions(chunks, fill_value, shape, func):
     assert_equal(actual, expected)
 
 
-@pytest.mark.parametrize("func", ("nanvar","var")) # Expect to expand this to other functions once written. Putting var in to begin with bc I know it will fail
+@pytest.mark.parametrize("func", ("nanvar","var")) # Expect to expand this to other functions once written. "nanvar" has updated chunk, combine functions. "var", for the moment, still uses the old algorithm
 @pytest.mark.parametrize("engine",("flox",)) # Expect to expand this to other engines once written
 @pytest.mark.parametrize("offset",(0,10e2,10e4,10e6,10e8,10e10,10e12)) # Should fail at 10e8 for old algorithm, and survive 10e12 for current
 def test_std_var_precision(func,engine,offset):

From c3a6d88b7b346bf5c5f36b62925679b8374c7eae Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Tue, 5 Aug 2025 11:25:29 +1000
Subject: [PATCH 16/54] Update flox/aggregate_flox.py

Co-authored-by: Deepak Cherian <dcherian@users.noreply.github.com>
---
 flox/aggregate_flox.py | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index 7e825e7a..e7245aec 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -18,10 +18,7 @@ def __init__(self, arrays):
         assert all(arrays[0].shape == a.shape for a in arrays), "Expect all arrays to have the same shape"
 
     def astype(self, dt, **kwargs):
-        new_arrays = []  # I really don't like doing this as a list
-        for array in self.arrays:  # Do we care about trying to avoid for loops here? three separate lines would be faster, but harder to read
-            new_arrays.append(array.astype(dt, **kwargs))
-        return MultiArray(new_arrays)
+        return MultiArray(tuple(array.astype(dt, **kwargs) for array in self.arrays))
 
     def reshape(self, shape, **kwargs):
         return MultiArray([array.reshape(shape, **kwargs) for array in self.arrays])

From 4dcd7c28081b6b929815790ba163cff6e2a8bcd0 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Tue, 5 Aug 2025 18:12:12 +1000
Subject: [PATCH 17/54] Replace some list comprehension with tuple

---
 flox/aggregate_flox.py | 19 ++++++-------------
 1 file changed, 6 insertions(+), 13 deletions(-)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index e7245aec..4179668c 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -21,10 +21,10 @@ def astype(self, dt, **kwargs):
         return MultiArray(tuple(array.astype(dt, **kwargs) for array in self.arrays))
 
     def reshape(self, shape, **kwargs):
-        return MultiArray([array.reshape(shape, **kwargs) for array in self.arrays])
+        return MultiArray(tuple(array.reshape(shape, **kwargs) for array in self.arrays))
 
     def squeeze(self, axis=None):
-        return MultiArray([array.squeeze(axis) for array in self.arrays])
+        return MultiArray(tuple(array.squeeze(axis) for array in self.arrays))
 
     def __array_function__(self, func, types, args, kwargs):
         if func not in MULTIARRAY_HANDLED_FUNCTIONS:
@@ -66,8 +66,8 @@ def decorator(func):
 @implements(np.expand_dims)
 def expand_dims_MultiArray(multiarray, axis):
     return MultiArray(
-        [np.expand_dims(a, axis) for a in multiarray.arrays]
-    )  # This is gonna spit out a list and I'm not sure if I'm okay with that?
+        tuple(np.expand_dims(a, axis) for a in multiarray.arrays)
+    )
 
 
 @implements(np.concatenate)
@@ -81,15 +81,8 @@ def concatenate_MultiArray(multiarrays, axis):
 
     # There's the potential for problematic different shapes coming in here.
     # Probably warrants some defensive programming, but I'm not sure what to check for while still being generic
-
-    # I don't like using append and lists here, but I can't work out how to do it better
-    new_arrays = []
-    for i in range(multiarrays[0].ndim):
-        new_arrays.append(np.concatenate([ma.arrays[i] for ma in multiarrays], axis))
-
-    out = MultiArray(new_arrays)
-    return out
-
+    
+    return MultiArray(tuple(np.concatenate(tuple(ma.arrays[i] for ma in multiarrays), axis) for i in range(multiarrays[0].ndim))) # Is this readable?
 
 @implements(np.transpose)
 def transpose_MultiArray(multiarray, axes):

From c101a2bee10763afad6b023b42770301242c371d Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Tue, 5 Aug 2025 08:13:20 +0000
Subject: [PATCH 18/54] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 flox/aggregate_flox.py | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index 4179668c..062c6415 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -65,9 +65,7 @@ def decorator(func):
 
 @implements(np.expand_dims)
 def expand_dims_MultiArray(multiarray, axis):
-    return MultiArray(
-        tuple(np.expand_dims(a, axis) for a in multiarray.arrays)
-    )
+    return MultiArray(tuple(np.expand_dims(a, axis) for a in multiarray.arrays))
 
 
 @implements(np.concatenate)
@@ -81,8 +79,14 @@ def concatenate_MultiArray(multiarrays, axis):
 
     # There's the potential for problematic different shapes coming in here.
     # Probably warrants some defensive programming, but I'm not sure what to check for while still being generic
-    
-    return MultiArray(tuple(np.concatenate(tuple(ma.arrays[i] for ma in multiarrays), axis) for i in range(multiarrays[0].ndim))) # Is this readable?
+
+    return MultiArray(
+        tuple(
+            np.concatenate(tuple(ma.arrays[i] for ma in multiarrays), axis)
+            for i in range(multiarrays[0].ndim)
+        )
+    )  # Is this readable?
+
 
 @implements(np.transpose)
 def transpose_MultiArray(multiarray, axes):

From 98e1b4ec0b4206fb2a0246d8b575bc7d074edf41 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Tue, 5 Aug 2025 07:19:58 -0600
Subject: [PATCH 19/54] Fixes

---
 flox/aggregations.py |  3 ++-
 flox/core.py         |  4 +++-
 tests/test_core.py   | 14 ++++++++++----
 3 files changed, 15 insertions(+), 6 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 975c3258..54ab23c4 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -10,6 +10,7 @@
 
 import numpy as np
 import pandas as pd
+import toolz as tlz
 from numpy.typing import ArrayLike, DTypeLike
 
 from . import aggregate_flox, aggregate_npg, xrutils
@@ -466,7 +467,7 @@ def _std_finalize(sumsq, sum_, count, ddof=0):
 nanvar = Aggregation(
     "nanvar",
     chunk=var_chunk,
-    numpy="nanvar",
+    numpy=tlz.compose(_var_finalize, var_chunk),
     combine=(_var_combine,),
     finalize=_var_finalize,
     fill_value=0,
diff --git a/flox/core.py b/flox/core.py
index 8200cb97..259fedbf 100644
--- a/flox/core.py
+++ b/flox/core.py
@@ -1300,7 +1300,9 @@ def chunk_reduce(
             kw_func.update(kw)
 
             # UGLY! but this is because the `var` breaks our design assumptions
-            if reduction is var_chunk:
+            if reduction is var_chunk or (
+                isinstance(reduction, tlz.functoolz.Compose) and reduction.first is var_chunk
+            ):
                 kw_func.update(engine=engine)
 
             if callable(reduction):
diff --git a/tests/test_core.py b/tests/test_core.py
index ef98ec04..cb021b5a 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -2253,16 +2253,22 @@ def test_std_var_precision(func, engine, offset):
     # Generate a dataset with small variance and big mean
     # Check that func with engine gives you the same answer as numpy
 
-    l = 1000
-    array = np.linspace(-1, 1, l)  # has zero mean
-    labels = np.arange(l) % 2  # Ideally we'd parametrize this too.
+    size = 1000
+    array = np.linspace(-1, 1, size)  # has zero mean
+    labels = np.arange(size) % 2  # Ideally we'd parametrize this too.
 
     # These two need to be the same function, but with the offset added and not added
     no_offset, _ = groupby_reduce(array, labels, engine=engine, func=func)
     with_offset, _ = groupby_reduce(array + offset, labels, engine=engine, func=func)
 
+    expected = np.concatenate([np.nanvar(array[::2], keepdims=True), np.nanvar(array[1::2], keepdims=True)])
+    expected_offset = np.concatenate(
+        [np.nanvar(array[::2] + offset, keepdims=True), np.nanvar(array[1::2] + offset, keepdims=True)]
+    )
+
     tol = {"rtol": 1e-8, "atol": 1e-10}  # Not sure how stringent to be here
 
+    assert_equal(expected, no_offset, tol)
+    assert_equal(expected_offset, with_offset, tol)
     # Failure threshold in my external tests is dependent on dask chunksize, maybe needs exploring better?
-
     assert_equal(no_offset, with_offset, tol)

From d0d09df2e499776cbc884b91589fd3954b3378f5 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Tue, 5 Aug 2025 09:45:10 -0600
Subject: [PATCH 20/54] minor edit for neater test reports.

---
 tests/test_core.py | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/tests/test_core.py b/tests/test_core.py
index cb021b5a..9f885d87 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -2247,13 +2247,14 @@ def test_sparse_nan_fill_value_reductions(chunks, fill_value, shape, func):
 )  # Expect to expand this to other functions once written. "nanvar" has updated chunk, combine functions. "var", for the moment, still uses the old algorithm
 @pytest.mark.parametrize("engine", ("flox",))  # Expect to expand this to other engines once written
 @pytest.mark.parametrize(
-    "offset", (0, 10e2, 10e4, 10e6, 10e8, 10e10, 10e12)
+    "exponent", (10, 12)
 )  # Should fail at 10e8 for old algorithm, and survive 10e12 for current
-def test_std_var_precision(func, engine, offset):
+def test_std_var_precision(func, exponent, engine):
     # Generate a dataset with small variance and big mean
     # Check that func with engine gives you the same answer as numpy
 
     size = 1000
+    offset = 10**exponent
     array = np.linspace(-1, 1, size)  # has zero mean
     labels = np.arange(size) % 2  # Ideally we'd parametrize this too.
 

From 1139a9ccf90064f15e7343a09cbfa4e0530b31f4 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Wed, 6 Aug 2025 08:29:34 +1000
Subject: [PATCH 21/54] Fix another list/tuple comprehension

---
 flox/aggregate_flox.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index 062c6415..c3404a2f 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -91,8 +91,8 @@ def concatenate_MultiArray(multiarrays, axis):
 @implements(np.transpose)
 def transpose_MultiArray(multiarray, axes):
     return MultiArray(
-        [np.transpose(a, axes) for a in multiarray.arrays]
-    )  # This is gonna spit out a list and I'm not sure if I'm okay with that?
+        tuple(np.transpose(a, axes) for a in multiarray.arrays)
+    )
 
 
 def _prepare_for_flox(group_idx, array):

From 569629c92b96b7faa8f94d1495b51f8d4323aab6 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Wed, 6 Aug 2025 08:57:06 +1000
Subject: [PATCH 22/54] implement np.full

---
 flox/aggregate_flox.py | 14 ++++++++++++++
 1 file changed, 14 insertions(+)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index c3404a2f..253d36df 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -94,6 +94,20 @@ def transpose_MultiArray(multiarray, axes):
         tuple(np.transpose(a, axes) for a in multiarray.arrays)
     )
 
+@implements(np.full)
+def full_MultiArray(shape, fill_values, *args, **kwargs): # I've used *args, **kwargs instead of the full argument list to give us more flexibility if numpy changes stuff https://numpy.org/doc/stable/reference/generated/numpy.full.html
+    ''' All arguments except fill_value are shared by each array
+    in the MultiArray.
+    Iterate over fill_values to create arrays
+    '''
+    return MultiArray(
+        tuple(
+            np.full(shape,fv,*args,**kwargs) # I'm 90% sure I've used *args, **kwargs correctly here -- could you double-check?
+            for fv in fill_values
+        )
+    )
+
+
 
 def _prepare_for_flox(group_idx, array):
     """

From 50ad095d3dd39fd7025a49532cf8d1c05ec80784 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Wed, 6 Aug 2025 10:06:08 +1000
Subject: [PATCH 23/54] Implement np.full and empty chunks in var_chunk

---
 flox/aggregations.py | 31 ++++++++++++++++++++-----------
 1 file changed, 20 insertions(+), 11 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 54ab23c4..652dd08a 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -355,7 +355,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
         engine=engine,
         axis=axis,
         size=size,
-        fill_value=fill_value,
+        fill_value=fill_value[2], # Unpack fill value bc it's currently defined for multiarray
         dtype=dtype,
     )
 
@@ -366,7 +366,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
         engine=engine,
         axis=axis,
         size=size,
-        fill_value=fill_value,
+        fill_value=fill_value[1], # Unpack fill value bc it's currently defined for multiarray
         dtype=dtype,
     )
 
@@ -380,7 +380,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
         engine=engine,
         axis=axis,
         size=size,
-        fill_value=fill_value,
+        fill_value=fill_value[0], # Unpack fill value bc it's currently defined for multiarray
         dtype=dtype,
     )
 
@@ -388,34 +388,43 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
 
 
 def _var_combine(array, axis, keepdims=True):
-    def clip_last(array):
+    def clip_last(array,n=1):
         """Return array except the last element along axis
         Purely included to tidy up the adj_terms line
         """
+        assert n>0, "Clipping nothing off the end isn't implemented"
         not_last = [slice(None, None) for i in range(array.ndim)]
-        not_last[axis[0]] = slice(None, -1)
+        not_last[axis[0]] = slice(None, -n)
         return array[*not_last]
 
-    def clip_first(array):
+    def clip_first(array,n=1):
         """Return array except the first element along axis
         Purely included to tidy up the adj_terms line
         """
         not_first = [slice(None, None) for i in range(array.ndim)]
-        not_first[axis[0]] = slice(1, None)
+        not_first[axis[0]] = slice(n, None)
         return array[*not_first]
 
     assert len(axis) == 1, "Assuming that the combine function is only in one direction at once"
 
     sum_deviations, sum_X, sum_len = array.arrays
 
-    # Calculate parts needed for cascading combination
+    # Calculate parts needed for cascading combination 
     cumsum_X = np.cumsum(sum_X, axis=axis[0])  # Don't need to be able to merge the last element
     cumsum_len = np.cumsum(sum_len, axis=axis[0])
-
+    
+    # There will be instances in which one or both chunks being merged are empty
+    # In which case, the adjustment term should be zero, but will throw a divide-by-zero error
+    # We're going to add a constant to the bottom of the adjustment term equation on those instances
+    # and count on the zeros on the top making our adjustment term still zero
+    zero_denominator = ((clip_last(cumsum_len)==0) | (clip_first(sum_len)==0))
+    
     # Adjustment terms to tweak the sum of squared deviations because not every chunk has the same mean
     adj_terms = (
         clip_last(cumsum_len) * clip_first(sum_X) - clip_first(sum_len) * clip_last(cumsum_X)
-    ) ** 2 / (clip_last(cumsum_len) * clip_first(sum_len) * (clip_last(cumsum_len) + clip_first(sum_len)))
+    ) ** 2 / (clip_last(cumsum_len) * clip_first(sum_len) * (clip_last(cumsum_len) + clip_first(sum_len))+zero_denominator.astype(int))
+    
+    assert np.all((adj_terms*zero_denominator) == 0), "Instances where we add something to the denominator must come out to zero"
 
     return aggregate_flox.MultiArray(
         (
@@ -470,7 +479,7 @@ def _std_finalize(sumsq, sum_, count, ddof=0):
     numpy=tlz.compose(_var_finalize, var_chunk),
     combine=(_var_combine,),
     finalize=_var_finalize,
-    fill_value=0,
+    fill_value=((0,0,0),), # DIVIDE BY ZERO ERROR! NOOOO!!!
     final_fill_value=np.nan,
     dtypes=(None,),
     final_dtype=np.floating,

From f88e231e435239e6b045472e14cc6285c1a24b48 Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Wed, 6 Aug 2025 00:06:23 +0000
Subject: [PATCH 24/54] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 flox/aggregate_flox.py | 18 ++++++++++--------
 flox/aggregations.py   | 33 +++++++++++++++++++--------------
 2 files changed, 29 insertions(+), 22 deletions(-)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index 253d36df..194991df 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -90,25 +90,27 @@ def concatenate_MultiArray(multiarrays, axis):
 
 @implements(np.transpose)
 def transpose_MultiArray(multiarray, axes):
-    return MultiArray(
-        tuple(np.transpose(a, axes) for a in multiarray.arrays)
-    )
+    return MultiArray(tuple(np.transpose(a, axes) for a in multiarray.arrays))
+
 
 @implements(np.full)
-def full_MultiArray(shape, fill_values, *args, **kwargs): # I've used *args, **kwargs instead of the full argument list to give us more flexibility if numpy changes stuff https://numpy.org/doc/stable/reference/generated/numpy.full.html
-    ''' All arguments except fill_value are shared by each array
+def full_MultiArray(
+    shape, fill_values, *args, **kwargs
+):  # I've used *args, **kwargs instead of the full argument list to give us more flexibility if numpy changes stuff https://numpy.org/doc/stable/reference/generated/numpy.full.html
+    """All arguments except fill_value are shared by each array
     in the MultiArray.
     Iterate over fill_values to create arrays
-    '''
+    """
     return MultiArray(
         tuple(
-            np.full(shape,fv,*args,**kwargs) # I'm 90% sure I've used *args, **kwargs correctly here -- could you double-check?
+            np.full(
+                shape, fv, *args, **kwargs
+            )  # I'm 90% sure I've used *args, **kwargs correctly here -- could you double-check?
             for fv in fill_values
         )
     )
 
 
-
 def _prepare_for_flox(group_idx, array):
     """
     Sort the input array once to save time.
diff --git a/flox/aggregations.py b/flox/aggregations.py
index 652dd08a..61d1436c 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -355,7 +355,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
         engine=engine,
         axis=axis,
         size=size,
-        fill_value=fill_value[2], # Unpack fill value bc it's currently defined for multiarray
+        fill_value=fill_value[2],  # Unpack fill value bc it's currently defined for multiarray
         dtype=dtype,
     )
 
@@ -366,7 +366,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
         engine=engine,
         axis=axis,
         size=size,
-        fill_value=fill_value[1], # Unpack fill value bc it's currently defined for multiarray
+        fill_value=fill_value[1],  # Unpack fill value bc it's currently defined for multiarray
         dtype=dtype,
     )
 
@@ -380,7 +380,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
         engine=engine,
         axis=axis,
         size=size,
-        fill_value=fill_value[0], # Unpack fill value bc it's currently defined for multiarray
+        fill_value=fill_value[0],  # Unpack fill value bc it's currently defined for multiarray
         dtype=dtype,
     )
 
@@ -388,16 +388,16 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
 
 
 def _var_combine(array, axis, keepdims=True):
-    def clip_last(array,n=1):
+    def clip_last(array, n=1):
         """Return array except the last element along axis
         Purely included to tidy up the adj_terms line
         """
-        assert n>0, "Clipping nothing off the end isn't implemented"
+        assert n > 0, "Clipping nothing off the end isn't implemented"
         not_last = [slice(None, None) for i in range(array.ndim)]
         not_last[axis[0]] = slice(None, -n)
         return array[*not_last]
 
-    def clip_first(array,n=1):
+    def clip_first(array, n=1):
         """Return array except the first element along axis
         Purely included to tidy up the adj_terms line
         """
@@ -409,22 +409,27 @@ def clip_first(array,n=1):
 
     sum_deviations, sum_X, sum_len = array.arrays
 
-    # Calculate parts needed for cascading combination 
+    # Calculate parts needed for cascading combination
     cumsum_X = np.cumsum(sum_X, axis=axis[0])  # Don't need to be able to merge the last element
     cumsum_len = np.cumsum(sum_len, axis=axis[0])
-    
+
     # There will be instances in which one or both chunks being merged are empty
     # In which case, the adjustment term should be zero, but will throw a divide-by-zero error
     # We're going to add a constant to the bottom of the adjustment term equation on those instances
     # and count on the zeros on the top making our adjustment term still zero
-    zero_denominator = ((clip_last(cumsum_len)==0) | (clip_first(sum_len)==0))
-    
+    zero_denominator = (clip_last(cumsum_len) == 0) | (clip_first(sum_len) == 0)
+
     # Adjustment terms to tweak the sum of squared deviations because not every chunk has the same mean
     adj_terms = (
         clip_last(cumsum_len) * clip_first(sum_X) - clip_first(sum_len) * clip_last(cumsum_X)
-    ) ** 2 / (clip_last(cumsum_len) * clip_first(sum_len) * (clip_last(cumsum_len) + clip_first(sum_len))+zero_denominator.astype(int))
-    
-    assert np.all((adj_terms*zero_denominator) == 0), "Instances where we add something to the denominator must come out to zero"
+    ) ** 2 / (
+        clip_last(cumsum_len) * clip_first(sum_len) * (clip_last(cumsum_len) + clip_first(sum_len))
+        + zero_denominator.astype(int)
+    )
+
+    assert np.all((adj_terms * zero_denominator) == 0), (
+        "Instances where we add something to the denominator must come out to zero"
+    )
 
     return aggregate_flox.MultiArray(
         (
@@ -479,7 +484,7 @@ def _std_finalize(sumsq, sum_, count, ddof=0):
     numpy=tlz.compose(_var_finalize, var_chunk),
     combine=(_var_combine,),
     finalize=_var_finalize,
-    fill_value=((0,0,0),), # DIVIDE BY ZERO ERROR! NOOOO!!!
+    fill_value=((0, 0, 0),),  # DIVIDE BY ZERO ERROR! NOOOO!!!
     final_fill_value=np.nan,
     dtypes=(None,),
     final_dtype=np.floating,

From 77526fd608227dabbc1139e4da7896085ac0adc3 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Wed, 6 Aug 2025 10:20:01 +1000
Subject: [PATCH 25/54] update comment

---
 flox/aggregations.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 652dd08a..a8738346 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -479,7 +479,7 @@ def _std_finalize(sumsq, sum_, count, ddof=0):
     numpy=tlz.compose(_var_finalize, var_chunk),
     combine=(_var_combine,),
     finalize=_var_finalize,
-    fill_value=((0,0,0),), # DIVIDE BY ZERO ERROR! NOOOO!!!
+    fill_value=((0,0,0),),
     final_fill_value=np.nan,
     dtypes=(None,),
     final_dtype=np.floating,

From 31f30c947f9d1be53f42af3e962cf71da19ca246 Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Wed, 6 Aug 2025 00:24:40 +0000
Subject: [PATCH 26/54] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 flox/aggregations.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 567a43e3..35e41bdd 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -484,7 +484,7 @@ def _std_finalize(sumsq, sum_, count, ddof=0):
     numpy=tlz.compose(_var_finalize, var_chunk),
     combine=(_var_combine,),
     finalize=_var_finalize,
-    fill_value=((0, 0, 0),), 
+    fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
     dtypes=(None,),
     final_dtype=np.floating,

From 3b3369f2a840737c2b815fbf31cc31f90a962a65 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Sun, 17 Aug 2025 21:06:06 -0600
Subject: [PATCH 27/54] edits

---
 flox/aggregate_flox.py | 21 ++++++++-------------
 flox/aggregations.py   | 20 ++++++++++++++------
 flox/core.py           |  5 ++---
 flox/xrutils.py        |  6 ++++++
 tests/test_core.py     |  2 +-
 5 files changed, 31 insertions(+), 23 deletions(-)

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index 194991df..5e3a64ee 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -26,6 +26,11 @@ def reshape(self, shape, **kwargs):
     def squeeze(self, axis=None):
         return MultiArray(tuple(array.squeeze(axis) for array in self.arrays))
 
+    def __setitem__(self, key, value):
+        assert len(value) == len(self.arrays)
+        for array, val in zip(self.arrays, value):
+            array[key] = val
+
     def __array_function__(self, func, types, args, kwargs):
         if func not in MULTIARRAY_HANDLED_FUNCTIONS:
             return NotImplemented
@@ -72,20 +77,10 @@ def expand_dims_MultiArray(multiarray, axis):
 def concatenate_MultiArray(multiarrays, axis):
     n_arrays = len(multiarrays[0].arrays)
     for ma in multiarrays[1:]:
-        if not (
-            len(ma.arrays) == n_arrays
-        ):  # I don't know what trying to concatenate MultiArrays with different numbers of arrays would even mean
-            raise NotImplementedError
-
-    # There's the potential for problematic different shapes coming in here.
-    # Probably warrants some defensive programming, but I'm not sure what to check for while still being generic
-
+        assert len(ma.arrays) == n_arrays
     return MultiArray(
-        tuple(
-            np.concatenate(tuple(ma.arrays[i] for ma in multiarrays), axis)
-            for i in range(multiarrays[0].ndim)
-        )
-    )  # Is this readable?
+        tuple(np.concatenate(tuple(ma.arrays[i] for ma in multiarrays), axis) for i in range(n_arrays))
+    )
 
 
 @implements(np.transpose)
diff --git a/flox/aggregations.py b/flox/aggregations.py
index 35e41bdd..13257a04 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -10,7 +10,6 @@
 
 import numpy as np
 import pandas as pd
-import toolz as tlz
 from numpy.typing import ArrayLike, DTypeLike
 
 from . import aggregate_flox, aggregate_npg, xrutils
@@ -355,7 +354,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
         engine=engine,
         axis=axis,
         size=size,
-        fill_value=fill_value[2],  # Unpack fill value bc it's currently defined for multiarray
+        fill_value=0,  # Unpack fill value bc it's currently defined for multiarray
         dtype=dtype,
     )
 
@@ -366,7 +365,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
         engine=engine,
         axis=axis,
         size=size,
-        fill_value=fill_value[1],  # Unpack fill value bc it's currently defined for multiarray
+        fill_value=0,  # Unpack fill value bc it's currently defined for multiarray
         dtype=dtype,
     )
 
@@ -380,7 +379,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
         engine=engine,
         axis=axis,
         size=size,
-        fill_value=fill_value[0],  # Unpack fill value bc it's currently defined for multiarray
+        fill_value=0,  # Unpack fill value bc it's currently defined for multiarray
         dtype=dtype,
     )
 
@@ -450,7 +449,10 @@ def clip_first(array, n=1):
 
 
 def _var_finalize(multiarray, ddof=0):
-    return multiarray.arrays[0] / (multiarray.arrays[2] - ddof)
+    den = multiarray.arrays[2] - ddof
+    # preserve nans for groups with 0 obs; so these values are -ddof
+    den[den < 0] = 0
+    return multiarray.arrays[0] / den
 
 
 def _std_finalize(sumsq, sum_, count, ddof=0):
@@ -478,10 +480,16 @@ def _std_finalize(sumsq, sum_, count, ddof=0):
 # dtypes=(None, None, np.intp),
 # final_dtype=np.floating,
 # )
+
+
+def blockwise_or_numpy_var(*args, ddof=0, **kwargs):
+    return _var_finalize(var_chunk(*args, **kwargs), ddof)
+
+
 nanvar = Aggregation(
     "nanvar",
     chunk=var_chunk,
-    numpy=tlz.compose(_var_finalize, var_chunk),
+    numpy=blockwise_or_numpy_var,
     combine=(_var_combine,),
     finalize=_var_finalize,
     fill_value=((0, 0, 0),),
diff --git a/flox/core.py b/flox/core.py
index 259fedbf..5547a9af 100644
--- a/flox/core.py
+++ b/flox/core.py
@@ -43,6 +43,7 @@
     ScanState,
     _atleast_1d,
     _initialize_aggregation,
+    blockwise_or_numpy_var,
     generic_aggregate,
     quantile_new_dims_func,
     var_chunk,
@@ -1300,9 +1301,7 @@ def chunk_reduce(
             kw_func.update(kw)
 
             # UGLY! but this is because the `var` breaks our design assumptions
-            if reduction is var_chunk or (
-                isinstance(reduction, tlz.functoolz.Compose) and reduction.first is var_chunk
-            ):
+            if reduction is var_chunk or blockwise_or_numpy_var:
                 kw_func.update(engine=engine)
 
             if callable(reduction):
diff --git a/flox/xrutils.py b/flox/xrutils.py
index 37e18567..9a839b46 100644
--- a/flox/xrutils.py
+++ b/flox/xrutils.py
@@ -146,6 +146,9 @@ def is_scalar(value: Any, include_0d: bool = True) -> bool:
 
 
 def notnull(data):
+    if isinstance(data, tuple) and len(data) == 3 and data == (0, 0, 0):
+        # boo: another special case for Var
+        return True
     if not is_duck_array(data):
         data = np.asarray(data)
 
@@ -163,6 +166,9 @@ def notnull(data):
 
 
 def isnull(data: Any):
+    if isinstance(data, tuple) and len(data) == 3 and data == (0, 0, 0):
+        # boo: another special case for Var
+        return False
     if data is None:
         return False
     if not is_duck_array(data):
diff --git a/tests/test_core.py b/tests/test_core.py
index 9f885d87..ee7bfcc9 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -2247,7 +2247,7 @@ def test_sparse_nan_fill_value_reductions(chunks, fill_value, shape, func):
 )  # Expect to expand this to other functions once written. "nanvar" has updated chunk, combine functions. "var", for the moment, still uses the old algorithm
 @pytest.mark.parametrize("engine", ("flox",))  # Expect to expand this to other engines once written
 @pytest.mark.parametrize(
-    "exponent", (10, 12)
+    "exponent", (2, 4, 6, 8, 10, 12)
 )  # Should fail at 10e8 for old algorithm, and survive 10e12 for current
 def test_std_var_precision(func, exponent, engine):
     # Generate a dataset with small variance and big mean

From 24fb5320f1e934655ceb0d79dd61e7a9833a305d Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Sun, 17 Aug 2025 21:31:04 -0600
Subject: [PATCH 28/54] support var, std

---
 flox/aggregations.py | 70 +++++++++++++++++++++++---------------------
 flox/core.py         |  7 ++---
 tests/test_core.py   |  2 +-
 3 files changed, 40 insertions(+), 39 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 13257a04..09649e41 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -343,7 +343,9 @@ def _mean_finalize(sum_, count):
 )
 
 
-def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=None, dtype=None):
+def var_chunk(
+    group_idx, array, *, skipna: bool, engine: str, axis=-1, size=None, fill_value=None, dtype=None
+):
     from .aggregate_flox import MultiArray
 
     # Calculate length and sum - important for the adjustment terms to sum squared deviations
@@ -361,7 +363,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
     array_sums = generic_aggregate(
         group_idx,
         array,
-        func="nansum",
+        func="nansum" if skipna else "sum",
         engine=engine,
         axis=axis,
         size=size,
@@ -375,7 +377,7 @@ def var_chunk(group_idx, array, *, engine: str, axis=-1, size=None, fill_value=N
     sum_squared_deviations = generic_aggregate(
         group_idx,
         (array - array_means[..., group_idx]) ** 2,
-        func="nansum",
+        func="nansum" if skipna else "sum",
         engine=engine,
         axis=axis,
         size=size,
@@ -448,6 +450,12 @@ def clip_first(array, n=1):
 # return result
 
 
+def is_var_chunk_reduction(agg: Callable) -> bool:
+    if isinstance(agg, partial):
+        agg = agg.func
+    return agg is blockwise_or_numpy_var or agg is var_chunk
+
+
 def _var_finalize(multiarray, ddof=0):
     den = multiarray.arrays[2] - ddof
     # preserve nans for groups with 0 obs; so these values are -ddof
@@ -455,41 +463,32 @@ def _var_finalize(multiarray, ddof=0):
     return multiarray.arrays[0] / den
 
 
-def _std_finalize(sumsq, sum_, count, ddof=0):
-    return np.sqrt(_var_finalize(sumsq, sum_, count, ddof))
+def _std_finalize(multiarray, ddof=0):
+    return np.sqrt(_var_finalize(multiarray, ddof))
+
+
+def blockwise_or_numpy_var(*args, skipna: bool, ddof=0, std=False, **kwargs):
+    res = _var_finalize(var_chunk(*args, skipna=skipna, **kwargs), ddof)
+    return np.sqrt(res) if std else res
 
 
 # var, std always promote to float, so we set nan
 var = Aggregation(
     "var",
-    chunk=("sum_of_squares", "sum", "nanlen"),
-    combine=("sum", "sum", "sum"),
+    chunk=partial(var_chunk, skipna=False),
+    numpy=partial(blockwise_or_numpy_var, skipna=False),
+    combine=(_var_combine,),
     finalize=_var_finalize,
-    fill_value=0,
+    fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(None, None, np.intp),
+    dtypes=(None,),
     final_dtype=np.floating,
 )
-# nanvar = Aggregation(
-# "nanvar",
-# chunk=("nansum_of_squares", "nansum", "nanlen"),
-# combine=("sum", "sum", "sum"),
-# finalize=_var_finalize,
-# fill_value=0,
-# final_fill_value=np.nan,
-# dtypes=(None, None, np.intp),
-# final_dtype=np.floating,
-# )
-
-
-def blockwise_or_numpy_var(*args, ddof=0, **kwargs):
-    return _var_finalize(var_chunk(*args, **kwargs), ddof)
-
 
 nanvar = Aggregation(
     "nanvar",
-    chunk=var_chunk,
-    numpy=blockwise_or_numpy_var,
+    chunk=partial(var_chunk, skipna=True),
+    numpy=partial(blockwise_or_numpy_var, skipna=True),
     combine=(_var_combine,),
     finalize=_var_finalize,
     fill_value=((0, 0, 0),),
@@ -497,24 +496,27 @@ def blockwise_or_numpy_var(*args, ddof=0, **kwargs):
     dtypes=(None,),
     final_dtype=np.floating,
 )
+
 std = Aggregation(
     "std",
-    chunk=("sum_of_squares", "sum", "nanlen"),
-    combine=("sum", "sum", "sum"),
+    chunk=partial(var_chunk, skipna=False),
+    numpy=partial(blockwise_or_numpy_var, skipna=False, std=True),
+    combine=(_var_combine,),
     finalize=_std_finalize,
-    fill_value=0,
+    fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(None, None, np.intp),
+    dtypes=(None,),
     final_dtype=np.floating,
 )
 nanstd = Aggregation(
     "nanstd",
-    chunk=("nansum_of_squares", "nansum", "nanlen"),
-    combine=("sum", "sum", "sum"),
+    chunk=partial(var_chunk, skipna=True),
+    numpy=partial(blockwise_or_numpy_var, skipna=True, std=True),
+    combine=(_var_combine,),
     finalize=_std_finalize,
-    fill_value=0,
+    fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(None, None, np.intp),
+    dtypes=(None,),
     final_dtype=np.floating,
 )
 
diff --git a/flox/core.py b/flox/core.py
index 5547a9af..d5cde638 100644
--- a/flox/core.py
+++ b/flox/core.py
@@ -43,10 +43,9 @@
     ScanState,
     _atleast_1d,
     _initialize_aggregation,
-    blockwise_or_numpy_var,
     generic_aggregate,
+    is_var_chunk_reduction,
     quantile_new_dims_func,
-    var_chunk,
 )
 from .cache import memoize
 from .lib import ArrayLayer, dask_array_type, sparse_array_type
@@ -1291,7 +1290,7 @@ def chunk_reduce(
     previous_reduction: T_Func = ""
     for reduction, fv, kw, dt in zip(funcs, fill_values, kwargss, dtypes):
         # UGLY! but this is because the `var` breaks our design assumptions
-        if empty and reduction is not var_chunk:
+        if empty and not is_var_chunk_reduction(reduction):
             result = np.full(shape=final_array_shape, fill_value=fv, like=array)
         elif is_nanlen(reduction) and is_nanlen(previous_reduction):
             result = results["intermediates"][-1]
@@ -1301,7 +1300,7 @@ def chunk_reduce(
             kw_func.update(kw)
 
             # UGLY! but this is because the `var` breaks our design assumptions
-            if reduction is var_chunk or blockwise_or_numpy_var:
+            if is_var_chunk_reduction(reduction):
                 kw_func.update(engine=engine)
 
             if callable(reduction):
diff --git a/tests/test_core.py b/tests/test_core.py
index ee7bfcc9..5620be30 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -236,7 +236,7 @@ def gen_array_by(size, func):
 @pytest.mark.parametrize("size", [(1, 12), (12,), (12, 9)])
 @pytest.mark.parametrize("nby", [1, 2, 3])
 @pytest.mark.parametrize("add_nan_by", [True, False])
-@pytest.mark.parametrize("func", ["nanvar"])
+@pytest.mark.parametrize("func", ["var", "nanvar", "std", "nanstd"])
 def test_groupby_reduce_all(to_sparse, nby, size, chunks, func, add_nan_by, engine):
     if ("arg" in func and engine in ["flox", "numbagg"]) or (func in BLOCKWISE_FUNCS and chunks != -1):
         pytest.skip()

From 177b8de8e66bb85ba2d128f960fce69bae5a6b01 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Sun, 17 Aug 2025 21:41:02 -0600
Subject: [PATCH 29/54] enable property tests

---
 tests/strategies.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/tests/strategies.py b/tests/strategies.py
index 76102047..ea9c2ed7 100644
--- a/tests/strategies.py
+++ b/tests/strategies.py
@@ -108,9 +108,8 @@ def insert_nans(draw: st.DrawFn, array: np.ndarray) -> np.ndarray:
     "any",
     "all",
 ] + list(SCIPY_STATS_FUNCS)
-SKIPPED_FUNCS = ["var", "std", "nanvar", "nanstd"]
 
-func_st = st.sampled_from([f for f in ALL_FUNCS if f not in NON_NUMPY_FUNCS and f not in SKIPPED_FUNCS])
+func_st = st.sampled_from([f for f in ALL_FUNCS if f not in NON_NUMPY_FUNCS])
 
 
 @st.composite

From 7deb84a20dd567ed2aefef12ed273648a68700f5 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Sun, 17 Aug 2025 21:43:02 -0600
Subject: [PATCH 30/54] cleanup

---
 flox/aggregate_flox.py | 100 -----------------------------------------
 flox/aggregations.py   |  15 ++-----
 flox/core.py           |   2 +-
 flox/multiarray.py     |  91 +++++++++++++++++++++++++++++++++++++
 tests/test_core.py     |  13 +++---
 5 files changed, 101 insertions(+), 120 deletions(-)
 create mode 100644 flox/multiarray.py

diff --git a/flox/aggregate_flox.py b/flox/aggregate_flox.py
index 5e3a64ee..12750645 100644
--- a/flox/aggregate_flox.py
+++ b/flox/aggregate_flox.py
@@ -1,110 +1,10 @@
 from functools import partial
-from typing import Self
 
 import numpy as np
 
 from . import xrdtypes as dtypes
 from .xrutils import is_scalar, isnull, notnull
 
-MULTIARRAY_HANDLED_FUNCTIONS = {}
-
-
-class MultiArray:
-    arrays: tuple[np.ndarray, ...]
-
-    def __init__(self, arrays):
-        self.arrays = arrays  # something else needed here to be more careful about types (not sure what)
-        # Do we want to co-erce arrays into a tuple and make sure it's immutable? Do we want it to be immutable?
-        assert all(arrays[0].shape == a.shape for a in arrays), "Expect all arrays to have the same shape"
-
-    def astype(self, dt, **kwargs):
-        return MultiArray(tuple(array.astype(dt, **kwargs) for array in self.arrays))
-
-    def reshape(self, shape, **kwargs):
-        return MultiArray(tuple(array.reshape(shape, **kwargs) for array in self.arrays))
-
-    def squeeze(self, axis=None):
-        return MultiArray(tuple(array.squeeze(axis) for array in self.arrays))
-
-    def __setitem__(self, key, value):
-        assert len(value) == len(self.arrays)
-        for array, val in zip(self.arrays, value):
-            array[key] = val
-
-    def __array_function__(self, func, types, args, kwargs):
-        if func not in MULTIARRAY_HANDLED_FUNCTIONS:
-            return NotImplemented
-        # Note: this allows subclasses that don't override
-        # __array_function__ to handle MyArray objects
-        # if not all(issubclass(t, MyArray) for t in types): # I can't see this being relevant at all for this code, but maybe it's safer to leave it in?
-        # return NotImplemented
-        return MULTIARRAY_HANDLED_FUNCTIONS[func](*args, **kwargs)
-
-    # Shape is needed, seems likely that the other two might be
-    # Making some strong assumptions here that all the arrays are the same shape, and I don't really like this
-    @property
-    def dtype(self) -> np.dtype:
-        return self.arrays[0].dtype
-
-    @property
-    def shape(self) -> tuple[int, ...]:
-        return self.arrays[0].shape
-
-    @property
-    def ndim(self) -> int:
-        return self.arrays[0].ndim
-
-    def __getitem__(self, key) -> Self:
-        return type(self)([array[key] for array in self.arrays])
-
-
-def implements(numpy_function):
-    """Register an __array_function__ implementation for MyArray objects."""
-
-    def decorator(func):
-        MULTIARRAY_HANDLED_FUNCTIONS[numpy_function] = func
-        return func
-
-    return decorator
-
-
-@implements(np.expand_dims)
-def expand_dims_MultiArray(multiarray, axis):
-    return MultiArray(tuple(np.expand_dims(a, axis) for a in multiarray.arrays))
-
-
-@implements(np.concatenate)
-def concatenate_MultiArray(multiarrays, axis):
-    n_arrays = len(multiarrays[0].arrays)
-    for ma in multiarrays[1:]:
-        assert len(ma.arrays) == n_arrays
-    return MultiArray(
-        tuple(np.concatenate(tuple(ma.arrays[i] for ma in multiarrays), axis) for i in range(n_arrays))
-    )
-
-
-@implements(np.transpose)
-def transpose_MultiArray(multiarray, axes):
-    return MultiArray(tuple(np.transpose(a, axes) for a in multiarray.arrays))
-
-
-@implements(np.full)
-def full_MultiArray(
-    shape, fill_values, *args, **kwargs
-):  # I've used *args, **kwargs instead of the full argument list to give us more flexibility if numpy changes stuff https://numpy.org/doc/stable/reference/generated/numpy.full.html
-    """All arguments except fill_value are shared by each array
-    in the MultiArray.
-    Iterate over fill_values to create arrays
-    """
-    return MultiArray(
-        tuple(
-            np.full(
-                shape, fv, *args, **kwargs
-            )  # I'm 90% sure I've used *args, **kwargs correctly here -- could you double-check?
-            for fv in fill_values
-        )
-    )
-
 
 def _prepare_for_flox(group_idx, array):
     """
diff --git a/flox/aggregations.py b/flox/aggregations.py
index 09649e41..ae46eb61 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -15,6 +15,7 @@
 from . import aggregate_flox, aggregate_npg, xrutils
 from . import xrdtypes as dtypes
 from .lib import dask_array_type, sparse_array_type
+from .multiarray import MultiArray
 
 if TYPE_CHECKING:
     FuncTuple = tuple[Callable | str, ...]
@@ -346,8 +347,6 @@ def _mean_finalize(sum_, count):
 def var_chunk(
     group_idx, array, *, skipna: bool, engine: str, axis=-1, size=None, fill_value=None, dtype=None
 ):
-    from .aggregate_flox import MultiArray
-
     # Calculate length and sum - important for the adjustment terms to sum squared deviations
     array_lens = generic_aggregate(
         group_idx,
@@ -432,22 +431,14 @@ def clip_first(array, n=1):
         "Instances where we add something to the denominator must come out to zero"
     )
 
-    return aggregate_flox.MultiArray(
+    return MultiArray(
         (
             np.sum(sum_deviations, axis=axis, keepdims=keepdims)
             + np.sum(adj_terms, axis=axis, keepdims=keepdims),  # sum of squared deviations
             np.sum(sum_X, axis=axis, keepdims=keepdims),  # sum of array items
             np.sum(sum_len, axis=axis, keepdims=keepdims),  # sum of array lengths
         )
-    )  # I'm not even pretending calling this class from there is a good idea, I think it wants to be somewhere else though
-
-
-# TODO: fix this for complex numbers
-# def _var_finalize(sumsq, sum_, count, ddof=0):
-# with np.errstate(invalid="ignore", divide="ignore"):
-# result = (sumsq - (sum_**2 / count)) / (count - ddof)
-# result[count <= ddof] = np.nan
-# return result
+    )
 
 
 def is_var_chunk_reduction(agg: Callable) -> bool:
diff --git a/flox/core.py b/flox/core.py
index d5cde638..577f93bf 100644
--- a/flox/core.py
+++ b/flox/core.py
@@ -2506,7 +2506,7 @@ def _choose_engine(by, agg: Aggregation):
 
     not_arg_reduce = not _is_arg_reduction(agg)
 
-    if agg.name in ["quantile", "nanquantile", "median", "nanmedian"]:
+    if agg.name in ["quantile", "nanquantile", "median", "nanmedian", "var", "nanvar", "std", "nanstd"]:
         logger.debug(f"_choose_engine: Choosing 'flox' since {agg.name}")
         return "flox"
 
diff --git a/flox/multiarray.py b/flox/multiarray.py
new file mode 100644
index 00000000..9a9f9e8f
--- /dev/null
+++ b/flox/multiarray.py
@@ -0,0 +1,91 @@
+from typing import Self
+
+import numpy as np
+
+MULTIARRAY_HANDLED_FUNCTIONS = {}
+
+
+class MultiArray:
+    arrays: tuple[np.ndarray, ...]
+
+    def __init__(self, arrays):
+        self.arrays = arrays
+        assert all(arrays[0].shape == a.shape for a in arrays), "Expect all arrays to have the same shape"
+
+    def astype(self, dt, **kwargs) -> Self:
+        return type(self)(tuple(array.astype(dt, **kwargs) for array in self.arrays))
+
+    def reshape(self, shape, **kwargs) -> Self:
+        return type(self)(tuple(array.reshape(shape, **kwargs) for array in self.arrays))
+
+    def squeeze(self, axis=None) -> Self:
+        return type(self)(tuple(array.squeeze(axis) for array in self.arrays))
+
+    def __setitem__(self, key, value) -> None:
+        assert len(value) == len(self.arrays)
+        for array, val in zip(self.arrays, value):
+            array[key] = val
+
+    def __array_function__(self, func, types, args, kwargs):
+        if func not in MULTIARRAY_HANDLED_FUNCTIONS:
+            return NotImplemented
+        # Note: this allows subclasses that don't override
+        # __array_function__ to handle MyArray objects
+        # if not all(issubclass(t, MyArray) for t in types): # I can't see this being relevant at all for this code, but maybe it's safer to leave it in?
+        # return NotImplemented
+        return MULTIARRAY_HANDLED_FUNCTIONS[func](*args, **kwargs)
+
+    # Shape is needed, seems likely that the other two might be
+    # Making some strong assumptions here that all the arrays are the same shape, and I don't really like this
+    @property
+    def dtype(self) -> np.dtype:
+        return self.arrays[0].dtype
+
+    @property
+    def shape(self) -> tuple[int, ...]:
+        return self.arrays[0].shape
+
+    @property
+    def ndim(self) -> int:
+        return self.arrays[0].ndim
+
+    def __getitem__(self, key) -> Self:
+        return type(self)([array[key] for array in self.arrays])
+
+
+def implements(numpy_function):
+    """Register an __array_function__ implementation for MyArray objects."""
+
+    def decorator(func):
+        MULTIARRAY_HANDLED_FUNCTIONS[numpy_function] = func
+        return func
+
+    return decorator
+
+
+@implements(np.expand_dims)
+def expand_dims(multiarray, axis) -> MultiArray:
+    return MultiArray(tuple(np.expand_dims(a, axis) for a in multiarray.arrays))
+
+
+@implements(np.concatenate)
+def concatenate(multiarrays, axis) -> MultiArray:
+    n_arrays = len(multiarrays[0].arrays)
+    for ma in multiarrays[1:]:
+        assert len(ma.arrays) == n_arrays
+    return MultiArray(
+        tuple(np.concatenate(tuple(ma.arrays[i] for ma in multiarrays), axis) for i in range(n_arrays))
+    )
+
+
+@implements(np.transpose)
+def transpose(multiarray, axes) -> MultiArray:
+    return MultiArray(tuple(np.transpose(a, axes) for a in multiarray.arrays))
+
+
+@implements(np.full)
+def full(shape, fill_values, *args, **kwargs) -> MultiArray:
+    """All arguments except fill_value are shared by each array in the MultiArray.
+    Iterate over fill_values to create arrays
+    """
+    return MultiArray(tuple(np.full(shape, fv, *args, **kwargs) for fv in fill_values))
diff --git a/tests/test_core.py b/tests/test_core.py
index 5620be30..4a98d3d3 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -236,7 +236,7 @@ def gen_array_by(size, func):
 @pytest.mark.parametrize("size", [(1, 12), (12,), (12, 9)])
 @pytest.mark.parametrize("nby", [1, 2, 3])
 @pytest.mark.parametrize("add_nan_by", [True, False])
-@pytest.mark.parametrize("func", ["var", "nanvar", "std", "nanstd"])
+@pytest.mark.parametrize("func", ALL_FUNCS)
 def test_groupby_reduce_all(to_sparse, nby, size, chunks, func, add_nan_by, engine):
     if ("arg" in func and engine in ["flox", "numbagg"]) or (func in BLOCKWISE_FUNCS and chunks != -1):
         pytest.skip()
@@ -2242,13 +2242,12 @@ def test_sparse_nan_fill_value_reductions(chunks, fill_value, shape, func):
     assert_equal(actual, expected)
 
 
+@pytest.mark.parametrize("func", ("nanvar", "var"))
 @pytest.mark.parametrize(
-    "func", ("nanvar", "var")
-)  # Expect to expand this to other functions once written. "nanvar" has updated chunk, combine functions. "var", for the moment, still uses the old algorithm
-@pytest.mark.parametrize("engine", ("flox",))  # Expect to expand this to other engines once written
-@pytest.mark.parametrize(
-    "exponent", (2, 4, 6, 8, 10, 12)
-)  # Should fail at 10e8 for old algorithm, and survive 10e12 for current
+    # Should fail at 10e8 for old algorithm, and survive 10e12 for current
+    "exponent",
+    (2, 4, 6, 8, 10, 12),
+)
 def test_std_var_precision(func, exponent, engine):
     # Generate a dataset with small variance and big mean
     # Check that func with engine gives you the same answer as numpy

From 120fbf30cfa5a7e4046f24eeeca4f58517ccf45e Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Sun, 17 Aug 2025 21:47:56 -0600
Subject: [PATCH 31/54] xfail some

---
 tests/test_core.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/tests/test_core.py b/tests/test_core.py
index 4a98d3d3..939b73a0 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -2270,5 +2270,8 @@ def test_std_var_precision(func, exponent, engine):
 
     assert_equal(expected, no_offset, tol)
     assert_equal(expected_offset, with_offset, tol)
-    # Failure threshold in my external tests is dependent on dask chunksize, maybe needs exploring better?
-    assert_equal(no_offset, with_offset, tol)
+    if exponent < 10:
+        # TODO: figure this exponent limit
+        # TODO: Failure threshold in my external tests is dependent on dask chunksize,
+        #       maybe needs exploring better?
+        assert_equal(no_offset, with_offset, tol)

From 4541c4653f0039df115d8a163f46b48c9e7de176 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Sun, 17 Aug 2025 21:54:45 -0600
Subject: [PATCH 32/54] revert some

---
 flox/core.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/flox/core.py b/flox/core.py
index 577f93bf..d5cde638 100644
--- a/flox/core.py
+++ b/flox/core.py
@@ -2506,7 +2506,7 @@ def _choose_engine(by, agg: Aggregation):
 
     not_arg_reduce = not _is_arg_reduction(agg)
 
-    if agg.name in ["quantile", "nanquantile", "median", "nanmedian", "var", "nanvar", "std", "nanstd"]:
+    if agg.name in ["quantile", "nanquantile", "median", "nanmedian"]:
         logger.debug(f"_choose_engine: Choosing 'flox' since {agg.name}")
         return "flox"
 

From aa4b9b32cc9971869643ad0216a7f74651fe59c4 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Sun, 17 Aug 2025 21:57:53 -0600
Subject: [PATCH 33/54] fix types

---
 flox/aggregations.py | 4 ++--
 flox/multiarray.py   | 3 ++-
 2 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index ae46eb61..38b66d28 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -162,8 +162,8 @@ def __init__(
         self,
         name: str,
         *,
-        numpy: str | None = None,
-        chunk: str | FuncTuple | None,
+        numpy: partial | str | None = None,
+        chunk: partial | str | FuncTuple | None,
         combine: str | FuncTuple | None,
         preprocess: Callable | None = None,
         finalize: Callable | None = None,
diff --git a/flox/multiarray.py b/flox/multiarray.py
index 9a9f9e8f..d9addd6f 100644
--- a/flox/multiarray.py
+++ b/flox/multiarray.py
@@ -1,8 +1,9 @@
+from collections.abc import Callable
 from typing import Self
 
 import numpy as np
 
-MULTIARRAY_HANDLED_FUNCTIONS = {}
+MULTIARRAY_HANDLED_FUNCTIONS: dict[Callable, Callable] = {}
 
 
 class MultiArray:

From d5c59e35e748ef960c4a50bf5f46d188b86c9cfa Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Sun, 17 Aug 2025 22:00:56 -0600
Subject: [PATCH 34/54] adjust tolerance

---
 tests/test_core.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_core.py b/tests/test_core.py
index 939b73a0..0cca23e3 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -2266,7 +2266,7 @@ def test_std_var_precision(func, exponent, engine):
         [np.nanvar(array[::2] + offset, keepdims=True), np.nanvar(array[1::2] + offset, keepdims=True)]
     )
 
-    tol = {"rtol": 1e-8, "atol": 1e-10}  # Not sure how stringent to be here
+    tol = {"rtol": 3e-8, "atol": 1e-9}  # Not sure how stringent to be here
 
     assert_equal(expected, no_offset, tol)
     assert_equal(expected_offset, with_offset, tol)

From b721433af5eaf7ded8ce8339264154b12e2a7cd6 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Tue, 19 Aug 2025 20:46:19 -0600
Subject: [PATCH 35/54] disable for cubed

---
 tests/test_core.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_core.py b/tests/test_core.py
index 0cca23e3..36d988ed 100644
--- a/tests/test_core.py
+++ b/tests/test_core.py
@@ -553,7 +553,7 @@ def test_groupby_agg_dask(func, shape, array_chunks, group_chunks, add_nan, dtyp
 def test_groupby_agg_cubed(func, shape, array_chunks, group_chunks, add_nan, engine, reindex):
     """Tests groupby_reduce with cubed arrays against groupby_reduce with numpy arrays"""
 
-    if func in ["first", "last"] or func in BLOCKWISE_FUNCS:
+    if func in ["first", "last", "var", "nanvar", "std", "nanstd"] or func in BLOCKWISE_FUNCS:
         pytest.skip()
 
     if "arg" in func and (engine in ["flox", "numbagg"] or reindex):

From 4f26ed82dfd73674700c231d79f914bb50c3b3ea Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Tue, 19 Aug 2025 20:48:37 -0600
Subject: [PATCH 36/54] handle nans in check

---
 flox/aggregations.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 38b66d28..333cc0b7 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -16,6 +16,7 @@
 from . import xrdtypes as dtypes
 from .lib import dask_array_type, sparse_array_type
 from .multiarray import MultiArray
+from .xrutils import notnull
 
 if TYPE_CHECKING:
     FuncTuple = tuple[Callable | str, ...]
@@ -427,7 +428,8 @@ def clip_first(array, n=1):
         + zero_denominator.astype(int)
     )
 
-    assert np.all((adj_terms * zero_denominator) == 0), (
+    check = adj_terms * zero_denominator
+    assert np.all(check[notnull(check)] == 0), (
         "Instances where we add something to the denominator must come out to zero"
     )
 

From d77c13291aae7b3976affb6985180e1613a2eb14 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Wed, 20 Aug 2025 15:58:47 +1000
Subject: [PATCH 37/54] Promote var/std to float64 from the beginning (dodgy)

---
 flox/aggregations.py | 16 ++++++++--------
 1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 333cc0b7..14469af2 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -474,8 +474,8 @@ def blockwise_or_numpy_var(*args, skipna: bool, ddof=0, std=False, **kwargs):
     finalize=_var_finalize,
     fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(None,),
-    final_dtype=np.floating,
+    dtypes=(np.float64,),
+    final_dtype=np.float64,
 )
 
 nanvar = Aggregation(
@@ -486,8 +486,8 @@ def blockwise_or_numpy_var(*args, skipna: bool, ddof=0, std=False, **kwargs):
     finalize=_var_finalize,
     fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(None,),
-    final_dtype=np.floating,
+    dtypes=(np.float64,),
+    final_dtype=np.float64,
 )
 
 std = Aggregation(
@@ -498,8 +498,8 @@ def blockwise_or_numpy_var(*args, skipna: bool, ddof=0, std=False, **kwargs):
     finalize=_std_finalize,
     fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(None,),
-    final_dtype=np.floating,
+    dtypes=(np.float64,),
+    final_dtype=np.float64,
 )
 nanstd = Aggregation(
     "nanstd",
@@ -509,8 +509,8 @@ def blockwise_or_numpy_var(*args, skipna: bool, ddof=0, std=False, **kwargs):
     finalize=_std_finalize,
     fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(None,),
-    final_dtype=np.floating,
+    dtypes=(np.float64,),
+    final_dtype=np.float64,
 )
 
 

From 3cbe54c9b45c9f8faf7fdd758ad021d7b41c872a Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Tue, 26 Aug 2025 10:37:09 +1000
Subject: [PATCH 38/54] Revert "Promote var/std to float64 from the beginning
 (dodgy)"

This reverts commit d77c13291aae7b3976affb6985180e1613a2eb14.
---
 flox/aggregations.py | 16 ++++++++--------
 1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 14469af2..333cc0b7 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -474,8 +474,8 @@ def blockwise_or_numpy_var(*args, skipna: bool, ddof=0, std=False, **kwargs):
     finalize=_var_finalize,
     fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(np.float64,),
-    final_dtype=np.float64,
+    dtypes=(None,),
+    final_dtype=np.floating,
 )
 
 nanvar = Aggregation(
@@ -486,8 +486,8 @@ def blockwise_or_numpy_var(*args, skipna: bool, ddof=0, std=False, **kwargs):
     finalize=_var_finalize,
     fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(np.float64,),
-    final_dtype=np.float64,
+    dtypes=(None,),
+    final_dtype=np.floating,
 )
 
 std = Aggregation(
@@ -498,8 +498,8 @@ def blockwise_or_numpy_var(*args, skipna: bool, ddof=0, std=False, **kwargs):
     finalize=_std_finalize,
     fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(np.float64,),
-    final_dtype=np.float64,
+    dtypes=(None,),
+    final_dtype=np.floating,
 )
 nanstd = Aggregation(
     "nanstd",
@@ -509,8 +509,8 @@ def blockwise_or_numpy_var(*args, skipna: bool, ddof=0, std=False, **kwargs):
     finalize=_std_finalize,
     fill_value=((0, 0, 0),),
     final_fill_value=np.nan,
-    dtypes=(np.float64,),
-    final_dtype=np.float64,
+    dtypes=(None,),
+    final_dtype=np.floating,
 )
 
 

From d7d772c7fc5ab74b80620a7c0b281b137eaf422b Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Wed, 27 Aug 2025 11:56:11 +1000
Subject: [PATCH 39/54] Handle combine along multiple dimensions

---
 flox/aggregations.py | 80 +++++++++++++++++++++++---------------------
 flox/multiarray.py   |  4 ++-
 2 files changed, 45 insertions(+), 39 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 333cc0b7..0880cdb6 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -389,58 +389,62 @@ def var_chunk(
 
 
 def _var_combine(array, axis, keepdims=True):
-    def clip_last(array, n=1):
+    def clip_last(array, ax, n=1):
         """Return array except the last element along axis
         Purely included to tidy up the adj_terms line
         """
         assert n > 0, "Clipping nothing off the end isn't implemented"
         not_last = [slice(None, None) for i in range(array.ndim)]
-        not_last[axis[0]] = slice(None, -n)
+        not_last[ax] = slice(None, -n)
         return array[*not_last]
 
-    def clip_first(array, n=1):
+    def clip_first(array, ax, n=1):
         """Return array except the first element along axis
         Purely included to tidy up the adj_terms line
         """
         not_first = [slice(None, None) for i in range(array.ndim)]
-        not_first[axis[0]] = slice(n, None)
+        not_first[ax] = slice(n, None)
         return array[*not_first]
+    
+    for ax in axis:
+        if array.shape[ax] == 1:
+            continue
+
+        sum_deviations, sum_X, sum_len = array.arrays
+
+        # Calculate parts needed for cascading combination
+        cumsum_X = np.cumsum(sum_X, axis=ax)  # Don't need to be able to merge the last element
+        cumsum_len = np.cumsum(sum_len, axis=ax)
+
+        # There will be instances in which one or both chunks being merged are empty
+        # In which case, the adjustment term should be zero, but will throw a divide-by-zero error
+        # We're going to add a constant to the bottom of the adjustment term equation on those instances
+        # and count on the zeros on the top making our adjustment term still zero
+        zero_denominator = (clip_last(cumsum_len, ax) == 0) | (clip_first(sum_len, ax) == 0)
+
+        # Adjustment terms to tweak the sum of squared deviations because not every chunk has the same mean
+        adj_terms = (
+            clip_last(cumsum_len, ax) * clip_first(sum_X, ax) - clip_first(sum_len, ax) * clip_last(cumsum_X, ax)
+        ) ** 2 / (
+            clip_last(cumsum_len, ax) * clip_first(sum_len, ax) * (clip_last(cumsum_len, ax) + clip_first(sum_len, ax))
+            + zero_denominator.astype(int)
+        )
+    
+        check = adj_terms * zero_denominator
+        assert np.all(check[notnull(check)] == 0), (
+            "Instances where we add something to the denominator must come out to zero"
+        )
 
-    assert len(axis) == 1, "Assuming that the combine function is only in one direction at once"
-
-    sum_deviations, sum_X, sum_len = array.arrays
-
-    # Calculate parts needed for cascading combination
-    cumsum_X = np.cumsum(sum_X, axis=axis[0])  # Don't need to be able to merge the last element
-    cumsum_len = np.cumsum(sum_len, axis=axis[0])
-
-    # There will be instances in which one or both chunks being merged are empty
-    # In which case, the adjustment term should be zero, but will throw a divide-by-zero error
-    # We're going to add a constant to the bottom of the adjustment term equation on those instances
-    # and count on the zeros on the top making our adjustment term still zero
-    zero_denominator = (clip_last(cumsum_len) == 0) | (clip_first(sum_len) == 0)
-
-    # Adjustment terms to tweak the sum of squared deviations because not every chunk has the same mean
-    adj_terms = (
-        clip_last(cumsum_len) * clip_first(sum_X) - clip_first(sum_len) * clip_last(cumsum_X)
-    ) ** 2 / (
-        clip_last(cumsum_len) * clip_first(sum_len) * (clip_last(cumsum_len) + clip_first(sum_len))
-        + zero_denominator.astype(int)
-    )
-
-    check = adj_terms * zero_denominator
-    assert np.all(check[notnull(check)] == 0), (
-        "Instances where we add something to the denominator must come out to zero"
-    )
-
-    return MultiArray(
-        (
-            np.sum(sum_deviations, axis=axis, keepdims=keepdims)
-            + np.sum(adj_terms, axis=axis, keepdims=keepdims),  # sum of squared deviations
-            np.sum(sum_X, axis=axis, keepdims=keepdims),  # sum of array items
-            np.sum(sum_len, axis=axis, keepdims=keepdims),  # sum of array lengths
+        array =  MultiArray(
+            (
+                np.sum(sum_deviations, axis=axis, keepdims=keepdims)
+                + np.sum(adj_terms, axis=axis, keepdims=keepdims),  # sum of squared deviations
+                np.sum(sum_X, axis=axis, keepdims=keepdims),  # sum of array items
+                np.sum(sum_len, axis=axis, keepdims=keepdims),  # sum of array lengths
+            )
         )
-    )
+    return array
+
 
 
 def is_var_chunk_reduction(agg: Callable) -> bool:
diff --git a/flox/multiarray.py b/flox/multiarray.py
index d9addd6f..19d8e660 100644
--- a/flox/multiarray.py
+++ b/flox/multiarray.py
@@ -78,11 +78,13 @@ def concatenate(multiarrays, axis) -> MultiArray:
         tuple(np.concatenate(tuple(ma.arrays[i] for ma in multiarrays), axis) for i in range(n_arrays))
     )
 
-
 @implements(np.transpose)
 def transpose(multiarray, axes) -> MultiArray:
     return MultiArray(tuple(np.transpose(a, axes) for a in multiarray.arrays))
 
+@implements(np.squeeze)
+def squeeze(multiarray, axis) -> MultiArray:
+    return MultiArray(tuple(np.squeeze(a, axis) for a in multiarray.arrays))
 
 @implements(np.full)
 def full(shape, fill_values, *args, **kwargs) -> MultiArray:

From 9a51095083edbc11663977ddb856f9c2c8a5ce1e Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Wed, 27 Aug 2025 01:56:25 +0000
Subject: [PATCH 40/54] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 flox/aggregations.py | 14 ++++++++------
 flox/multiarray.py   |  3 +++
 2 files changed, 11 insertions(+), 6 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 0880cdb6..8f63c8d8 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -405,7 +405,7 @@ def clip_first(array, ax, n=1):
         not_first = [slice(None, None) for i in range(array.ndim)]
         not_first[ax] = slice(n, None)
         return array[*not_first]
-    
+
     for ax in axis:
         if array.shape[ax] == 1:
             continue
@@ -424,18 +424,21 @@ def clip_first(array, ax, n=1):
 
         # Adjustment terms to tweak the sum of squared deviations because not every chunk has the same mean
         adj_terms = (
-            clip_last(cumsum_len, ax) * clip_first(sum_X, ax) - clip_first(sum_len, ax) * clip_last(cumsum_X, ax)
+            clip_last(cumsum_len, ax) * clip_first(sum_X, ax)
+            - clip_first(sum_len, ax) * clip_last(cumsum_X, ax)
         ) ** 2 / (
-            clip_last(cumsum_len, ax) * clip_first(sum_len, ax) * (clip_last(cumsum_len, ax) + clip_first(sum_len, ax))
+            clip_last(cumsum_len, ax)
+            * clip_first(sum_len, ax)
+            * (clip_last(cumsum_len, ax) + clip_first(sum_len, ax))
             + zero_denominator.astype(int)
         )
-    
+
         check = adj_terms * zero_denominator
         assert np.all(check[notnull(check)] == 0), (
             "Instances where we add something to the denominator must come out to zero"
         )
 
-        array =  MultiArray(
+        array = MultiArray(
             (
                 np.sum(sum_deviations, axis=axis, keepdims=keepdims)
                 + np.sum(adj_terms, axis=axis, keepdims=keepdims),  # sum of squared deviations
@@ -446,7 +449,6 @@ def clip_first(array, ax, n=1):
     return array
 
 
-
 def is_var_chunk_reduction(agg: Callable) -> bool:
     if isinstance(agg, partial):
         agg = agg.func
diff --git a/flox/multiarray.py b/flox/multiarray.py
index 19d8e660..20116099 100644
--- a/flox/multiarray.py
+++ b/flox/multiarray.py
@@ -78,14 +78,17 @@ def concatenate(multiarrays, axis) -> MultiArray:
         tuple(np.concatenate(tuple(ma.arrays[i] for ma in multiarrays), axis) for i in range(n_arrays))
     )
 
+
 @implements(np.transpose)
 def transpose(multiarray, axes) -> MultiArray:
     return MultiArray(tuple(np.transpose(a, axes) for a in multiarray.arrays))
 
+
 @implements(np.squeeze)
 def squeeze(multiarray, axis) -> MultiArray:
     return MultiArray(tuple(np.squeeze(a, axis) for a in multiarray.arrays))
 
+
 @implements(np.full)
 def full(shape, fill_values, *args, **kwargs) -> MultiArray:
     """All arguments except fill_value are shared by each array in the MultiArray.

From 1373318d69d7e9a79ce20dc1952b770933099e1f Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Wed, 27 Aug 2025 11:57:54 +1000
Subject: [PATCH 41/54] Comments

---
 flox/aggregations.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 8f63c8d8..445fd56b 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -413,7 +413,7 @@ def clip_first(array, ax, n=1):
         sum_deviations, sum_X, sum_len = array.arrays
 
         # Calculate parts needed for cascading combination
-        cumsum_X = np.cumsum(sum_X, axis=ax)  # Don't need to be able to merge the last element
+        cumsum_X = np.cumsum(sum_X, axis=ax) 
         cumsum_len = np.cumsum(sum_len, axis=ax)
 
         # There will be instances in which one or both chunks being merged are empty

From 4f1549574052f1ec325c83b548300cfb935ac784 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Wed, 27 Aug 2025 11:59:26 +1000
Subject: [PATCH 42/54] Technicalities regarding multiple dimensions in var
 combine

---
 flox/aggregations.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 445fd56b..a0d262d6 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -440,10 +440,10 @@ def clip_first(array, ax, n=1):
 
         array = MultiArray(
             (
-                np.sum(sum_deviations, axis=axis, keepdims=keepdims)
-                + np.sum(adj_terms, axis=axis, keepdims=keepdims),  # sum of squared deviations
-                np.sum(sum_X, axis=axis, keepdims=keepdims),  # sum of array items
-                np.sum(sum_len, axis=axis, keepdims=keepdims),  # sum of array lengths
+                np.sum(sum_deviations, axis=ax, keepdims=keepdims)
+                + np.sum(adj_terms, axis=ax, keepdims=keepdims),  # sum of squared deviations
+                np.sum(sum_X, axis=ax, keepdims=keepdims),  # sum of array items
+                np.sum(sum_len, axis=ax, keepdims=keepdims),  # sum of array lengths
             )
         )
     return array

From 591997c76f6f88338ec91011dcbad1d50603755f Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Wed, 27 Aug 2025 01:59:38 +0000
Subject: [PATCH 43/54] [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
---
 flox/aggregations.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index a0d262d6..38dc1218 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -413,7 +413,7 @@ def clip_first(array, ax, n=1):
         sum_deviations, sum_X, sum_len = array.arrays
 
         # Calculate parts needed for cascading combination
-        cumsum_X = np.cumsum(sum_X, axis=ax) 
+        cumsum_X = np.cumsum(sum_X, axis=ax)
         cumsum_len = np.cumsum(sum_len, axis=ax)
 
         # There will be instances in which one or both chunks being merged are empty

From bbc0be234ec4b2cdcb29ed73bf85e154d5b8ae66 Mon Sep 17 00:00:00 2001
From: jemmajeffree <98864717+jemmajeffree@users.noreply.github.com>
Date: Wed, 27 Aug 2025 12:18:22 +1000
Subject: [PATCH 44/54] more explicit NaNs in empty groups

---
 flox/aggregations.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 38dc1218..b82ce0cb 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -458,7 +458,7 @@ def is_var_chunk_reduction(agg: Callable) -> bool:
 def _var_finalize(multiarray, ddof=0):
     den = multiarray.arrays[2] - ddof
     # preserve nans for groups with 0 obs; so these values are -ddof
-    den[den < 0] = 0
+    den[den <= 0] = np.nan
     return multiarray.arrays[0] / den
 
 

From 63d7e96632599c00070138bd191326b86652d987 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Wed, 27 Aug 2025 21:06:13 -0600
Subject: [PATCH 45/54] Better "more explicit NaNs in empty groups"

---
 flox/aggregations.py | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index b82ce0cb..8b53d147 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -458,8 +458,9 @@ def is_var_chunk_reduction(agg: Callable) -> bool:
 def _var_finalize(multiarray, ddof=0):
     den = multiarray.arrays[2] - ddof
     # preserve nans for groups with 0 obs; so these values are -ddof
-    den[den <= 0] = np.nan
-    return multiarray.arrays[0] / den
+    ret = multiarray.arrays[0] / den
+    ret[den < 0] = np.nan
+    return ret
 
 
 def _std_finalize(multiarray, ddof=0):

From 779c1d2a567e7c87138455d2e4e56f6a703fc3a2 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Tue, 16 Sep 2025 07:02:58 -0600
Subject: [PATCH 46/54] Add skip

---
 flox/core.py             | 1 +
 tests/test_properties.py | 2 +-
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/flox/core.py b/flox/core.py
index 953dabf7..8681efed 100644
--- a/flox/core.py
+++ b/flox/core.py
@@ -2791,6 +2791,7 @@ def groupby_reduce(
             array = array.view(np.int64)
         elif is_cftime:
             offset = array.min()
+            assert offset is not None
             array = datetime_to_numeric(array, offset, datetime_unit="us")
 
     if nax == 1 and by_.ndim > 1 and expected_ is None:
diff --git a/tests/test_properties.py b/tests/test_properties.py
index a1b10511..527bdd85 100644
--- a/tests/test_properties.py
+++ b/tests/test_properties.py
@@ -99,7 +99,7 @@ def test_groupby_reduce(data, array, func: str) -> None:
 
     # TODO: funny bugs with overflows here
     is_cftime = _contains_cftime_datetimes(array)
-    assume(not (is_cftime and func in ["prod", "nanprod"]))
+    assume(not (is_cftime and func in ["prod", "nanprod", "var", "std", "nanvar", "nanstd"]))
 
     axis = -1
     by = data.draw(

From e4560815d792019a012f21c86f3c208413e8d584 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Tue, 16 Sep 2025 07:08:44 -0600
Subject: [PATCH 47/54] [revert]

---
 .github/workflows/ci.yaml | 2 +-
 flox/core.py              | 1 +
 tests/test_properties.py  | 5 +++--
 3 files changed, 5 insertions(+), 3 deletions(-)

diff --git a/.github/workflows/ci.yaml b/.github/workflows/ci.yaml
index 48a7df79..c52145d1 100644
--- a/.github/workflows/ci.yaml
+++ b/.github/workflows/ci.yaml
@@ -71,7 +71,7 @@ jobs:
         id: status
         run: |
           uv run --no-dev python -c "import xarray; xarray.show_versions()" || true
-          uv run --no-dev pytest --durations=20 --durations-min=0.5 -n auto --cov=./ --cov-report=xml --hypothesis-profile ci
+          uv run --no-dev pytest --durations=20 --durations-min=0.5 -n auto --cov=./ --cov-report=xml --hypothesis-profile ci tests/test_properties.py::test_groupby_reduce
       - name: Upload code coverage to Codecov
         uses: codecov/codecov-action@v5.5.0
         with:
diff --git a/flox/core.py b/flox/core.py
index 8681efed..6cba5dd1 100644
--- a/flox/core.py
+++ b/flox/core.py
@@ -3002,6 +3002,7 @@ def groupby_reduce(
         elif is_cftime:
             asdelta = _to_pytimedelta(result, unit="us")
             nanmask = np.isnan(result)
+            print(result, asdelta, offset)
             asdelta[nanmask] = datetime.timedelta(microseconds=0)
             result = asdelta + offset
             result[nanmask] = np.timedelta64("NaT")
diff --git a/tests/test_properties.py b/tests/test_properties.py
index 527bdd85..4c6e31bf 100644
--- a/tests/test_properties.py
+++ b/tests/test_properties.py
@@ -14,7 +14,7 @@
 import hypothesis.extra.numpy as npst
 import hypothesis.strategies as st
 import numpy as np
-from hypothesis import assume, given, note, settings
+from hypothesis import assume, given, note, reproduce_failure, settings
 
 import flox
 from flox.core import _is_sparse_supported_reduction, groupby_reduce, groupby_scan
@@ -88,6 +88,7 @@ def not_overflowing_array(array: np.ndarray[Any, Any]) -> bool:
     func=func_st,
 )
 @settings(deadline=None)
+@reproduce_failure("6.138.16", b"AXicc2RyZHRkYHRkAmIGRwYGEM+J/QKQAvOhkNGRA8ICMgGmLQaD")
 def test_groupby_reduce(data, array, func: str) -> None:
     # overflow behaviour differs between bincount and sum (for example)
     assume(not_overflowing_array(array))
@@ -99,7 +100,7 @@ def test_groupby_reduce(data, array, func: str) -> None:
 
     # TODO: funny bugs with overflows here
     is_cftime = _contains_cftime_datetimes(array)
-    assume(not (is_cftime and func in ["prod", "nanprod", "var", "std", "nanvar", "nanstd"]))
+    assume(not (is_cftime and func in ["prod", "nanprod"]))
 
     axis = -1
     by = data.draw(

From 8eaddc1b00b5eced97edc9edd9263754fb7b5c2d Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Tue, 16 Sep 2025 07:54:56 -0600
Subject: [PATCH 48/54] [revert]

---
 flox/core.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/flox/core.py b/flox/core.py
index 6cba5dd1..4bdc71bd 100644
--- a/flox/core.py
+++ b/flox/core.py
@@ -3002,7 +3002,7 @@ def groupby_reduce(
         elif is_cftime:
             asdelta = _to_pytimedelta(result, unit="us")
             nanmask = np.isnan(result)
-            print(result, asdelta, offset)
+            print(array.compute(), result.compute(), np.array(asdelta), offset.compute())
             asdelta[nanmask] = datetime.timedelta(microseconds=0)
             result = asdelta + offset
             result[nanmask] = np.timedelta64("NaT")

From 2abaf3218d2d8417c59daddd43a6b2ac129a8f06 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Tue, 16 Sep 2025 21:28:56 -0600
Subject: [PATCH 49/54] fix

---
 flox/core.py             |   1 -
 tests/test_properties.py |   2 +-
 uv.lock                  | 176 +++++++++++++++++++++++++++++++++++++--
 3 files changed, 171 insertions(+), 8 deletions(-)

diff --git a/flox/core.py b/flox/core.py
index 4bdc71bd..8681efed 100644
--- a/flox/core.py
+++ b/flox/core.py
@@ -3002,7 +3002,6 @@ def groupby_reduce(
         elif is_cftime:
             asdelta = _to_pytimedelta(result, unit="us")
             nanmask = np.isnan(result)
-            print(array.compute(), result.compute(), np.array(asdelta), offset.compute())
             asdelta[nanmask] = datetime.timedelta(microseconds=0)
             result = asdelta + offset
             result[nanmask] = np.timedelta64("NaT")
diff --git a/tests/test_properties.py b/tests/test_properties.py
index 4c6e31bf..a974f834 100644
--- a/tests/test_properties.py
+++ b/tests/test_properties.py
@@ -100,7 +100,7 @@ def test_groupby_reduce(data, array, func: str) -> None:
 
     # TODO: funny bugs with overflows here
     is_cftime = _contains_cftime_datetimes(array)
-    assume(not (is_cftime and func in ["prod", "nanprod"]))
+    assume(not (is_cftime and func in ["prod", "nanprod", "var", "nanvar", "std", "nanstd"]))
 
     axis = -1
     by = data.draw(
diff --git a/uv.lock b/uv.lock
index 86c4f048..2688d630 100644
--- a/uv.lock
+++ b/uv.lock
@@ -251,6 +251,27 @@ css = [
     { name = "tinycss2" },
 ]
 
+[[package]]
+name = "bokeh"
+version = "3.8.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "contourpy" },
+    { name = "jinja2" },
+    { name = "narwhals" },
+    { name = "numpy" },
+    { name = "packaging" },
+    { name = "pandas" },
+    { name = "pillow" },
+    { name = "pyyaml" },
+    { name = "tornado", marker = "sys_platform != 'emscripten'" },
+    { name = "xyzservices" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/78/bd/8455ecfaa8100dbfbb2af40061c689a7a9c808f4f8c9582f0efd0c8c9a19/bokeh-3.8.0.tar.gz", hash = "sha256:bfdf5e9df910653b097f70cd38f4c2399d91af6e54a618126e2387cc33c9ec03", size = 6529746, upload-time = "2025-08-29T12:16:55.005Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/96/9a/8e641b5415e12036d8a206147b8229d917a767b7d939521458d90feddcf5/bokeh-3.8.0-py3-none-any.whl", hash = "sha256:117c5e559231ad39fef87891a1a1b62b3bfefbaa47d536023537338f46015841", size = 7205343, upload-time = "2025-08-29T12:16:52.77Z" },
+]
+
 [[package]]
 name = "build"
 version = "1.3.0"
@@ -828,6 +849,17 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/8e/56/55dda22a8dbe291032735f7025dd69d9a70e4c440279ae98cc7c3888aa70/dask-2025.9.0-py3-none-any.whl", hash = "sha256:cb8d74476dda10c558234c02d1639386cc5c9cef0252245cf77043fb1f2495d1", size = 1477763, upload-time = "2025-09-10T10:16:06.474Z" },
 ]
 
+[package.optional-dependencies]
+complete = [
+    { name = "bokeh" },
+    { name = "distributed" },
+    { name = "jinja2" },
+    { name = "lz4" },
+    { name = "numpy" },
+    { name = "pandas" },
+    { name = "pyarrow" },
+]
+
 [[package]]
 name = "debugpy"
 version = "1.8.16"
@@ -876,6 +908,32 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/33/6b/e0547afaf41bf2c42e52430072fa5658766e3d65bd4b03a563d1b6336f57/distlib-0.4.0-py2.py3-none-any.whl", hash = "sha256:9659f7d87e46584a30b5780e43ac7a2143098441670ff0a49d5f9034c54a6c16", size = 469047, upload-time = "2025-07-17T16:51:58.613Z" },
 ]
 
+[[package]]
+name = "distributed"
+version = "2025.9.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "click" },
+    { name = "cloudpickle" },
+    { name = "dask" },
+    { name = "jinja2" },
+    { name = "locket" },
+    { name = "msgpack" },
+    { name = "packaging" },
+    { name = "psutil" },
+    { name = "pyyaml" },
+    { name = "sortedcontainers" },
+    { name = "tblib" },
+    { name = "toolz" },
+    { name = "tornado" },
+    { name = "urllib3" },
+    { name = "zict" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/73/3f/115c2828366c08d631935a19575ebc23491788cb2a93baa1ad3e94b5358f/distributed-2025.9.0.tar.gz", hash = "sha256:f10e09d6f314e8959b97b633a44ce1807e89197445119fa313333c2df527d25a", size = 1101035, upload-time = "2025-09-10T10:15:19.382Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/f9/b2/810bb4f4dfe5560d5eb36efda2221e51d1e38a04c3c10fa3cec311ce21e4/distributed-2025.9.0-py3-none-any.whl", hash = "sha256:87c35e4aefb5525d44032b40d7d780b4e9e398b6d567ca5bb6cc7b2150c48aa9", size = 1008961, upload-time = "2025-09-10T10:15:16.425Z" },
+]
+
 [[package]]
 name = "docutils"
 version = "0.21.2"
@@ -1038,7 +1096,7 @@ dev = [
     { name = "cftime" },
     { name = "codecov" },
     { name = "cubed" },
-    { name = "dask" },
+    { name = "dask", extra = ["complete"] },
     { name = "hypothesis" },
     { name = "ipykernel" },
     { name = "line-profiler" },
@@ -1277,7 +1335,7 @@ provides-extras = ["all", "test", "docs"]
 [package.metadata.requires-dev]
 all = [
     { name = "cachey" },
-    { name = "dask", extras = ["core"] },
+    { name = "dask" },
     { name = "numba" },
     { name = "numbagg", specifier = ">=0.3" },
     { name = "xarray" },
@@ -1299,7 +1357,7 @@ complete = [
     { name = "cftime" },
     { name = "codecov" },
     { name = "cubed", specifier = ">=0.20.0" },
-    { name = "dask", extras = ["core"] },
+    { name = "dask" },
     { name = "hypothesis" },
     { name = "lxml" },
     { name = "matplotlib" },
@@ -1323,8 +1381,8 @@ dev = [
     { name = "cftime" },
     { name = "codecov" },
     { name = "cubed", specifier = ">=0.20.0" },
-    { name = "dask", extras = ["all"] },
-    { name = "dask", extras = ["core"] },
+    { name = "dask" },
+    { name = "dask", extras = ["complete"] },
     { name = "hypothesis" },
     { name = "ipykernel" },
     { name = "line-profiler" },
@@ -1437,7 +1495,7 @@ numpy1 = [
     { name = "cftime" },
     { name = "codecov" },
     { name = "cubed", specifier = ">=0.20.0" },
-    { name = "dask", extras = ["core"] },
+    { name = "dask" },
     { name = "hypothesis" },
     { name = "lxml" },
     { name = "matplotlib" },
@@ -2401,6 +2459,38 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/b6/db/8f620f1ac62cf32554821b00b768dd5957ac8e3fd051593532be5b40b438/lxml-6.0.1-pp311-pypy311_pp73-win_amd64.whl", hash = "sha256:51bd5d1a9796ca253db6045ab45ca882c09c071deafffc22e06975b7ace36300", size = 3518127, upload-time = "2025-08-22T10:37:51.66Z" },
 ]
 
+[[package]]
+name = "lz4"
+version = "4.4.4"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/c6/5a/945f5086326d569f14c84ac6f7fcc3229f0b9b1e8cc536b951fd53dfb9e1/lz4-4.4.4.tar.gz", hash = "sha256:070fd0627ec4393011251a094e08ed9fdcc78cb4e7ab28f507638eee4e39abda", size = 171884, upload-time = "2025-04-01T22:55:58.62Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/28/e8/63843dc5ecb1529eb38e1761ceed04a0ad52a9ad8929ab8b7930ea2e4976/lz4-4.4.4-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:ddfc7194cd206496c445e9e5b0c47f970ce982c725c87bd22de028884125b68f", size = 220898, upload-time = "2025-04-01T22:55:23.085Z" },
+    { url = "https://files.pythonhosted.org/packages/e4/94/c53de5f07c7dc11cf459aab2a1d754f5df5f693bfacbbe1e4914bfd02f1e/lz4-4.4.4-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:714f9298c86f8e7278f1c6af23e509044782fa8220eb0260f8f8f1632f820550", size = 189685, upload-time = "2025-04-01T22:55:24.413Z" },
+    { url = "https://files.pythonhosted.org/packages/fe/59/c22d516dd0352f2a3415d1f665ccef2f3e74ecec3ca6a8f061a38f97d50d/lz4-4.4.4-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:a8474c91de47733856c6686df3c4aca33753741da7e757979369c2c0d32918ba", size = 1239225, upload-time = "2025-04-01T22:55:25.737Z" },
+    { url = "https://files.pythonhosted.org/packages/81/af/665685072e71f3f0e626221b7922867ec249cd8376aca761078c8f11f5da/lz4-4.4.4-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:80dd27d7d680ea02c261c226acf1d41de2fd77af4fb2da62b278a9376e380de0", size = 1265881, upload-time = "2025-04-01T22:55:26.817Z" },
+    { url = "https://files.pythonhosted.org/packages/90/04/b4557ae381d3aa451388a29755cc410066f5e2f78c847f66f154f4520a68/lz4-4.4.4-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:9b7d6dddfd01b49aedb940fdcaf32f41dc58c926ba35f4e31866aeec2f32f4f4", size = 1185593, upload-time = "2025-04-01T22:55:27.896Z" },
+    { url = "https://files.pythonhosted.org/packages/7b/e4/03636979f4e8bf92c557f998ca98ee4e6ef92e92eaf0ed6d3c7f2524e790/lz4-4.4.4-cp311-cp311-win32.whl", hash = "sha256:4134b9fd70ac41954c080b772816bb1afe0c8354ee993015a83430031d686a4c", size = 88259, upload-time = "2025-04-01T22:55:29.03Z" },
+    { url = "https://files.pythonhosted.org/packages/07/f0/9efe53b4945441a5d2790d455134843ad86739855b7e6199977bf6dc8898/lz4-4.4.4-cp311-cp311-win_amd64.whl", hash = "sha256:f5024d3ca2383470f7c4ef4d0ed8eabad0b22b23eeefde1c192cf1a38d5e9f78", size = 99916, upload-time = "2025-04-01T22:55:29.933Z" },
+    { url = "https://files.pythonhosted.org/packages/87/c8/1675527549ee174b9e1db089f7ddfbb962a97314657269b1e0344a5eaf56/lz4-4.4.4-cp311-cp311-win_arm64.whl", hash = "sha256:6ea715bb3357ea1665f77874cf8f55385ff112553db06f3742d3cdcec08633f7", size = 89741, upload-time = "2025-04-01T22:55:31.184Z" },
+    { url = "https://files.pythonhosted.org/packages/f7/2d/5523b4fabe11cd98f040f715728d1932eb7e696bfe94391872a823332b94/lz4-4.4.4-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:23ae267494fdd80f0d2a131beff890cf857f1b812ee72dbb96c3204aab725553", size = 220669, upload-time = "2025-04-01T22:55:32.032Z" },
+    { url = "https://files.pythonhosted.org/packages/91/06/1a5bbcacbfb48d8ee5b6eb3fca6aa84143a81d92946bdb5cd6b005f1863e/lz4-4.4.4-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:fff9f3a1ed63d45cb6514bfb8293005dc4141341ce3500abdfeb76124c0b9b2e", size = 189661, upload-time = "2025-04-01T22:55:33.413Z" },
+    { url = "https://files.pythonhosted.org/packages/fa/08/39eb7ac907f73e11a69a11576a75a9e36406b3241c0ba41453a7eb842abb/lz4-4.4.4-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:1ea7f07329f85a8eda4d8cf937b87f27f0ac392c6400f18bea2c667c8b7f8ecc", size = 1238775, upload-time = "2025-04-01T22:55:34.835Z" },
+    { url = "https://files.pythonhosted.org/packages/e9/26/05840fbd4233e8d23e88411a066ab19f1e9de332edddb8df2b6a95c7fddc/lz4-4.4.4-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:8ccab8f7f7b82f9fa9fc3b0ba584d353bd5aa818d5821d77d5b9447faad2aaad", size = 1265143, upload-time = "2025-04-01T22:55:35.933Z" },
+    { url = "https://files.pythonhosted.org/packages/b7/5d/5f2db18c298a419932f3ab2023deb689863cf8fd7ed875b1c43492479af2/lz4-4.4.4-cp312-cp312-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:e43e9d48b2daf80e486213128b0763deed35bbb7a59b66d1681e205e1702d735", size = 1185032, upload-time = "2025-04-01T22:55:37.454Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/e6/736ab5f128694b0f6aac58343bcf37163437ac95997276cd0be3ea4c3342/lz4-4.4.4-cp312-cp312-win32.whl", hash = "sha256:33e01e18e4561b0381b2c33d58e77ceee850a5067f0ece945064cbaac2176962", size = 88284, upload-time = "2025-04-01T22:55:38.536Z" },
+    { url = "https://files.pythonhosted.org/packages/40/b8/243430cb62319175070e06e3a94c4c7bd186a812e474e22148ae1290d47d/lz4-4.4.4-cp312-cp312-win_amd64.whl", hash = "sha256:d21d1a2892a2dcc193163dd13eaadabb2c1b803807a5117d8f8588b22eaf9f12", size = 99918, upload-time = "2025-04-01T22:55:39.628Z" },
+    { url = "https://files.pythonhosted.org/packages/6c/e1/0686c91738f3e6c2e1a243e0fdd4371667c4d2e5009b0a3605806c2aa020/lz4-4.4.4-cp312-cp312-win_arm64.whl", hash = "sha256:2f4f2965c98ab254feddf6b5072854a6935adab7bc81412ec4fe238f07b85f62", size = 89736, upload-time = "2025-04-01T22:55:40.5Z" },
+    { url = "https://files.pythonhosted.org/packages/3b/3c/d1d1b926d3688263893461e7c47ed7382a969a0976fc121fc678ec325fc6/lz4-4.4.4-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:ed6eb9f8deaf25ee4f6fad9625d0955183fdc90c52b6f79a76b7f209af1b6e54", size = 220678, upload-time = "2025-04-01T22:55:41.78Z" },
+    { url = "https://files.pythonhosted.org/packages/26/89/8783d98deb058800dabe07e6cdc90f5a2a8502a9bad8c5343c641120ace2/lz4-4.4.4-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:18ae4fe3bafb344dbd09f976d45cbf49c05c34416f2462828f9572c1fa6d5af7", size = 189670, upload-time = "2025-04-01T22:55:42.775Z" },
+    { url = "https://files.pythonhosted.org/packages/22/ab/a491ace69a83a8914a49f7391e92ca0698f11b28d5ce7b2ececa2be28e9a/lz4-4.4.4-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:57fd20c5fc1a49d1bbd170836fccf9a338847e73664f8e313dce6ac91b8c1e02", size = 1238746, upload-time = "2025-04-01T22:55:43.797Z" },
+    { url = "https://files.pythonhosted.org/packages/97/12/a1f2f4fdc6b7159c0d12249456f9fe454665b6126e98dbee9f2bd3cf735c/lz4-4.4.4-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:e9cb387c33f014dae4db8cb4ba789c8d2a0a6d045ddff6be13f6c8d9def1d2a6", size = 1265119, upload-time = "2025-04-01T22:55:44.943Z" },
+    { url = "https://files.pythonhosted.org/packages/50/6e/e22e50f5207649db6ea83cd31b79049118305be67e96bec60becf317afc6/lz4-4.4.4-cp313-cp313-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:d0be9f68240231e1e44118a4ebfecd8a5d4184f0bdf5c591c98dd6ade9720afd", size = 1184954, upload-time = "2025-04-01T22:55:46.161Z" },
+    { url = "https://files.pythonhosted.org/packages/4c/c4/2a458039645fcc6324ece731d4d1361c5daf960b553d1fcb4261ba07d51c/lz4-4.4.4-cp313-cp313-win32.whl", hash = "sha256:e9ec5d45ea43684f87c316542af061ef5febc6a6b322928f059ce1fb289c298a", size = 88289, upload-time = "2025-04-01T22:55:47.601Z" },
+    { url = "https://files.pythonhosted.org/packages/00/96/b8e24ea7537ab418074c226279acfcaa470e1ea8271003e24909b6db942b/lz4-4.4.4-cp313-cp313-win_amd64.whl", hash = "sha256:a760a175b46325b2bb33b1f2bbfb8aa21b48e1b9653e29c10b6834f9bb44ead4", size = 99925, upload-time = "2025-04-01T22:55:48.463Z" },
+    { url = "https://files.pythonhosted.org/packages/a5/a5/f9838fe6aa132cfd22733ed2729d0592259fff074cefb80f19aa0607367b/lz4-4.4.4-cp313-cp313-win_arm64.whl", hash = "sha256:f4c21648d81e0dda38b4720dccc9006ae33b0e9e7ffe88af6bf7d4ec124e2fba", size = 89743, upload-time = "2025-04-01T22:55:49.716Z" },
+]
+
 [[package]]
 name = "markdown-it-py"
 version = "3.0.0"
@@ -2630,6 +2720,44 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/7a/f0/8282d9641415e9e33df173516226b404d367a0fc55e1a60424a152913abc/mistune-3.1.4-py3-none-any.whl", hash = "sha256:93691da911e5d9d2e23bc54472892aff676df27a75274962ff9edc210364266d", size = 53481, upload-time = "2025-08-29T07:20:42.218Z" },
 ]
 
+[[package]]
+name = "msgpack"
+version = "1.1.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/45/b1/ea4f68038a18c77c9467400d166d74c4ffa536f34761f7983a104357e614/msgpack-1.1.1.tar.gz", hash = "sha256:77b79ce34a2bdab2594f490c8e80dd62a02d650b91a75159a63ec413b8d104cd", size = 173555, upload-time = "2025-06-13T06:52:51.324Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/7f/83/97f24bf9848af23fe2ba04380388216defc49a8af6da0c28cc636d722502/msgpack-1.1.1-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:71ef05c1726884e44f8b1d1773604ab5d4d17729d8491403a705e649116c9558", size = 82728, upload-time = "2025-06-13T06:51:50.68Z" },
+    { url = "https://files.pythonhosted.org/packages/aa/7f/2eaa388267a78401f6e182662b08a588ef4f3de6f0eab1ec09736a7aaa2b/msgpack-1.1.1-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:36043272c6aede309d29d56851f8841ba907a1a3d04435e43e8a19928e243c1d", size = 79279, upload-time = "2025-06-13T06:51:51.72Z" },
+    { url = "https://files.pythonhosted.org/packages/f8/46/31eb60f4452c96161e4dfd26dbca562b4ec68c72e4ad07d9566d7ea35e8a/msgpack-1.1.1-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:a32747b1b39c3ac27d0670122b57e6e57f28eefb725e0b625618d1b59bf9d1e0", size = 423859, upload-time = "2025-06-13T06:51:52.749Z" },
+    { url = "https://files.pythonhosted.org/packages/45/16/a20fa8c32825cc7ae8457fab45670c7a8996d7746ce80ce41cc51e3b2bd7/msgpack-1.1.1-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:8a8b10fdb84a43e50d38057b06901ec9da52baac6983d3f709d8507f3889d43f", size = 429975, upload-time = "2025-06-13T06:51:53.97Z" },
+    { url = "https://files.pythonhosted.org/packages/86/ea/6c958e07692367feeb1a1594d35e22b62f7f476f3c568b002a5ea09d443d/msgpack-1.1.1-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:ba0c325c3f485dc54ec298d8b024e134acf07c10d494ffa24373bea729acf704", size = 413528, upload-time = "2025-06-13T06:51:55.507Z" },
+    { url = "https://files.pythonhosted.org/packages/75/05/ac84063c5dae79722bda9f68b878dc31fc3059adb8633c79f1e82c2cd946/msgpack-1.1.1-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:88daaf7d146e48ec71212ce21109b66e06a98e5e44dca47d853cbfe171d6c8d2", size = 413338, upload-time = "2025-06-13T06:51:57.023Z" },
+    { url = "https://files.pythonhosted.org/packages/69/e8/fe86b082c781d3e1c09ca0f4dacd457ede60a13119b6ce939efe2ea77b76/msgpack-1.1.1-cp311-cp311-musllinux_1_2_i686.whl", hash = "sha256:d8b55ea20dc59b181d3f47103f113e6f28a5e1c89fd5b67b9140edb442ab67f2", size = 422658, upload-time = "2025-06-13T06:51:58.419Z" },
+    { url = "https://files.pythonhosted.org/packages/3b/2b/bafc9924df52d8f3bb7c00d24e57be477f4d0f967c0a31ef5e2225e035c7/msgpack-1.1.1-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:4a28e8072ae9779f20427af07f53bbb8b4aa81151054e882aee333b158da8752", size = 427124, upload-time = "2025-06-13T06:51:59.969Z" },
+    { url = "https://files.pythonhosted.org/packages/a2/3b/1f717e17e53e0ed0b68fa59e9188f3f610c79d7151f0e52ff3cd8eb6b2dc/msgpack-1.1.1-cp311-cp311-win32.whl", hash = "sha256:7da8831f9a0fdb526621ba09a281fadc58ea12701bc709e7b8cbc362feabc295", size = 65016, upload-time = "2025-06-13T06:52:01.294Z" },
+    { url = "https://files.pythonhosted.org/packages/48/45/9d1780768d3b249accecc5a38c725eb1e203d44a191f7b7ff1941f7df60c/msgpack-1.1.1-cp311-cp311-win_amd64.whl", hash = "sha256:5fd1b58e1431008a57247d6e7cc4faa41c3607e8e7d4aaf81f7c29ea013cb458", size = 72267, upload-time = "2025-06-13T06:52:02.568Z" },
+    { url = "https://files.pythonhosted.org/packages/e3/26/389b9c593eda2b8551b2e7126ad3a06af6f9b44274eb3a4f054d48ff7e47/msgpack-1.1.1-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:ae497b11f4c21558d95de9f64fff7053544f4d1a17731c866143ed6bb4591238", size = 82359, upload-time = "2025-06-13T06:52:03.909Z" },
+    { url = "https://files.pythonhosted.org/packages/ab/65/7d1de38c8a22cf8b1551469159d4b6cf49be2126adc2482de50976084d78/msgpack-1.1.1-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:33be9ab121df9b6b461ff91baac6f2731f83d9b27ed948c5b9d1978ae28bf157", size = 79172, upload-time = "2025-06-13T06:52:05.246Z" },
+    { url = "https://files.pythonhosted.org/packages/0f/bd/cacf208b64d9577a62c74b677e1ada005caa9b69a05a599889d6fc2ab20a/msgpack-1.1.1-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:6f64ae8fe7ffba251fecb8408540c34ee9df1c26674c50c4544d72dbf792e5ce", size = 425013, upload-time = "2025-06-13T06:52:06.341Z" },
+    { url = "https://files.pythonhosted.org/packages/4d/ec/fd869e2567cc9c01278a736cfd1697941ba0d4b81a43e0aa2e8d71dab208/msgpack-1.1.1-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:a494554874691720ba5891c9b0b39474ba43ffb1aaf32a5dac874effb1619e1a", size = 426905, upload-time = "2025-06-13T06:52:07.501Z" },
+    { url = "https://files.pythonhosted.org/packages/55/2a/35860f33229075bce803a5593d046d8b489d7ba2fc85701e714fc1aaf898/msgpack-1.1.1-cp312-cp312-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:cb643284ab0ed26f6957d969fe0dd8bb17beb567beb8998140b5e38a90974f6c", size = 407336, upload-time = "2025-06-13T06:52:09.047Z" },
+    { url = "https://files.pythonhosted.org/packages/8c/16/69ed8f3ada150bf92745fb4921bd621fd2cdf5a42e25eb50bcc57a5328f0/msgpack-1.1.1-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:d275a9e3c81b1093c060c3837e580c37f47c51eca031f7b5fb76f7b8470f5f9b", size = 409485, upload-time = "2025-06-13T06:52:10.382Z" },
+    { url = "https://files.pythonhosted.org/packages/c6/b6/0c398039e4c6d0b2e37c61d7e0e9d13439f91f780686deb8ee64ecf1ae71/msgpack-1.1.1-cp312-cp312-musllinux_1_2_i686.whl", hash = "sha256:4fd6b577e4541676e0cc9ddc1709d25014d3ad9a66caa19962c4f5de30fc09ef", size = 412182, upload-time = "2025-06-13T06:52:11.644Z" },
+    { url = "https://files.pythonhosted.org/packages/b8/d0/0cf4a6ecb9bc960d624c93effaeaae75cbf00b3bc4a54f35c8507273cda1/msgpack-1.1.1-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:bb29aaa613c0a1c40d1af111abf025f1732cab333f96f285d6a93b934738a68a", size = 419883, upload-time = "2025-06-13T06:52:12.806Z" },
+    { url = "https://files.pythonhosted.org/packages/62/83/9697c211720fa71a2dfb632cad6196a8af3abea56eece220fde4674dc44b/msgpack-1.1.1-cp312-cp312-win32.whl", hash = "sha256:870b9a626280c86cff9c576ec0d9cbcc54a1e5ebda9cd26dab12baf41fee218c", size = 65406, upload-time = "2025-06-13T06:52:14.271Z" },
+    { url = "https://files.pythonhosted.org/packages/c0/23/0abb886e80eab08f5e8c485d6f13924028602829f63b8f5fa25a06636628/msgpack-1.1.1-cp312-cp312-win_amd64.whl", hash = "sha256:5692095123007180dca3e788bb4c399cc26626da51629a31d40207cb262e67f4", size = 72558, upload-time = "2025-06-13T06:52:15.252Z" },
+    { url = "https://files.pythonhosted.org/packages/a1/38/561f01cf3577430b59b340b51329803d3a5bf6a45864a55f4ef308ac11e3/msgpack-1.1.1-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:3765afa6bd4832fc11c3749be4ba4b69a0e8d7b728f78e68120a157a4c5d41f0", size = 81677, upload-time = "2025-06-13T06:52:16.64Z" },
+    { url = "https://files.pythonhosted.org/packages/09/48/54a89579ea36b6ae0ee001cba8c61f776451fad3c9306cd80f5b5c55be87/msgpack-1.1.1-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:8ddb2bcfd1a8b9e431c8d6f4f7db0773084e107730ecf3472f1dfe9ad583f3d9", size = 78603, upload-time = "2025-06-13T06:52:17.843Z" },
+    { url = "https://files.pythonhosted.org/packages/a0/60/daba2699b308e95ae792cdc2ef092a38eb5ee422f9d2fbd4101526d8a210/msgpack-1.1.1-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:196a736f0526a03653d829d7d4c5500a97eea3648aebfd4b6743875f28aa2af8", size = 420504, upload-time = "2025-06-13T06:52:18.982Z" },
+    { url = "https://files.pythonhosted.org/packages/20/22/2ebae7ae43cd8f2debc35c631172ddf14e2a87ffcc04cf43ff9df9fff0d3/msgpack-1.1.1-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:9d592d06e3cc2f537ceeeb23d38799c6ad83255289bb84c2e5792e5a8dea268a", size = 423749, upload-time = "2025-06-13T06:52:20.211Z" },
+    { url = "https://files.pythonhosted.org/packages/40/1b/54c08dd5452427e1179a40b4b607e37e2664bca1c790c60c442c8e972e47/msgpack-1.1.1-cp313-cp313-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:4df2311b0ce24f06ba253fda361f938dfecd7b961576f9be3f3fbd60e87130ac", size = 404458, upload-time = "2025-06-13T06:52:21.429Z" },
+    { url = "https://files.pythonhosted.org/packages/2e/60/6bb17e9ffb080616a51f09928fdd5cac1353c9becc6c4a8abd4e57269a16/msgpack-1.1.1-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:e4141c5a32b5e37905b5940aacbc59739f036930367d7acce7a64e4dec1f5e0b", size = 405976, upload-time = "2025-06-13T06:52:22.995Z" },
+    { url = "https://files.pythonhosted.org/packages/ee/97/88983e266572e8707c1f4b99c8fd04f9eb97b43f2db40e3172d87d8642db/msgpack-1.1.1-cp313-cp313-musllinux_1_2_i686.whl", hash = "sha256:b1ce7f41670c5a69e1389420436f41385b1aa2504c3b0c30620764b15dded2e7", size = 408607, upload-time = "2025-06-13T06:52:24.152Z" },
+    { url = "https://files.pythonhosted.org/packages/bc/66/36c78af2efaffcc15a5a61ae0df53a1d025f2680122e2a9eb8442fed3ae4/msgpack-1.1.1-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:4147151acabb9caed4e474c3344181e91ff7a388b888f1e19ea04f7e73dc7ad5", size = 424172, upload-time = "2025-06-13T06:52:25.704Z" },
+    { url = "https://files.pythonhosted.org/packages/8c/87/a75eb622b555708fe0427fab96056d39d4c9892b0c784b3a721088c7ee37/msgpack-1.1.1-cp313-cp313-win32.whl", hash = "sha256:500e85823a27d6d9bba1d057c871b4210c1dd6fb01fbb764e37e4e8847376323", size = 65347, upload-time = "2025-06-13T06:52:26.846Z" },
+    { url = "https://files.pythonhosted.org/packages/ca/91/7dc28d5e2a11a5ad804cf2b7f7a5fcb1eb5a4966d66a5d2b41aee6376543/msgpack-1.1.1-cp313-cp313-win_amd64.whl", hash = "sha256:6d489fba546295983abd142812bda76b57e33d0b9f5d5b71c09a583285506f69", size = 72341, upload-time = "2025-06-13T06:52:27.835Z" },
+]
+
 [[package]]
 name = "mypy"
 version = "1.18.1"
@@ -2715,6 +2843,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/5f/df/76d0321c3797b54b60fef9ec3bd6f4cfd124b9e422182156a1dd418722cf/myst_parser-4.0.1-py3-none-any.whl", hash = "sha256:9134e88959ec3b5780aedf8a99680ea242869d012e8821db3126d427edc9c95d", size = 84579, upload-time = "2025-02-12T10:53:02.078Z" },
 ]
 
+[[package]]
+name = "narwhals"
+version = "2.5.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/7b/b8/3cb005704866f1cc19e8d6b15d0467255821ba12d82f20ea15912672e54c/narwhals-2.5.0.tar.gz", hash = "sha256:8ae0b6f39597f14c0dc52afc98949d6f8be89b5af402d2d98101d2f7d3561418", size = 558573, upload-time = "2025-09-12T10:04:24.436Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/f8/5a/22741c5c0e5f6e8050242bfc2052ba68bc94b1735ed5bca35404d136d6ec/narwhals-2.5.0-py3-none-any.whl", hash = "sha256:7e213f9ca7db3f8bf6f7eff35eaee6a1cf80902997e1b78d49b7755775d8f423", size = 407296, upload-time = "2025-09-12T10:04:22.524Z" },
+]
+
 [[package]]
 name = "nbclient"
 version = "0.10.2"
@@ -4272,6 +4409,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/40/44/4a5f08c96eb108af5cb50b41f76142f0afa346dfa99d5296fe7202a11854/tabulate-0.9.0-py3-none-any.whl", hash = "sha256:024ca478df22e9340661486f85298cff5f6dcdba14f3813e8830015b9ed1948f", size = 35252, upload-time = "2022-10-06T17:21:44.262Z" },
 ]
 
+[[package]]
+name = "tblib"
+version = "3.1.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/54/95/4b3044ec4bf248186769629bbfb495a458deb6e4c1f9eff7f298ae1e336e/tblib-3.1.0.tar.gz", hash = "sha256:06404c2c9f07f66fee2d7d6ad43accc46f9c3361714d9b8426e7f47e595cd652", size = 30766, upload-time = "2025-03-31T12:58:27.473Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/27/44/aa5c8b10b2cce7a053018e0d132bd58e27527a0243c4985383d5b6fd93e9/tblib-3.1.0-py3-none-any.whl", hash = "sha256:670bb4582578134b3d81a84afa1b016128b429f3d48e6cbbaecc9d15675e984e", size = 12552, upload-time = "2025-03-31T12:58:26.142Z" },
+]
+
 [[package]]
 name = "tenacity"
 version = "9.1.2"
@@ -4622,6 +4768,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/8d/f0/73c24457c941b8b08f7d090853e40f4b2cdde88b5da721f3f28e98df77c9/xarray-2025.9.0-py3-none-any.whl", hash = "sha256:79f0e25fb39571f612526ee998ee5404d8725a1db3951aabffdb287388885df0", size = 1349595, upload-time = "2025-09-04T04:20:24.36Z" },
 ]
 
+[[package]]
+name = "xyzservices"
+version = "2025.4.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/00/af/c0f7f97bb320d14c089476f487b81f733238cc5603e0914f2e409f49d589/xyzservices-2025.4.0.tar.gz", hash = "sha256:6fe764713648fac53450fbc61a3c366cb6ae5335a1b2ae0c3796b495de3709d8", size = 1134722, upload-time = "2025-04-25T10:38:09.669Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/d6/7d/b77455d7c7c51255b2992b429107fab811b2e36ceaf76da1e55a045dc568/xyzservices-2025.4.0-py3-none-any.whl", hash = "sha256:8d4db9a59213ccb4ce1cf70210584f30b10795bff47627cdfb862b39ff6e10c9", size = 90391, upload-time = "2025-04-25T10:38:08.468Z" },
+]
+
 [[package]]
 name = "zarr"
 version = "3.1.2"
@@ -4638,6 +4793,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/e0/a3/d3d4fd394a10b1256f9dccb2fe0ddd125fc575d7c437b1c70df050f14176/zarr-3.1.2-py3-none-any.whl", hash = "sha256:c3e180f53ee0ef91b86f7feff6f9dd381ddd1b512d1a46580530966a493387b6", size = 261041, upload-time = "2025-08-25T15:32:29.522Z" },
 ]
 
+[[package]]
+name = "zict"
+version = "3.0.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/d1/ac/3c494dd7ec5122cff8252c1a209b282c0867af029f805ae9befd73ae37eb/zict-3.0.0.tar.gz", hash = "sha256:e321e263b6a97aafc0790c3cfb3c04656b7066e6738c37fffcca95d803c9fba5", size = 33238, upload-time = "2023-04-17T21:41:16.041Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/80/ab/11a76c1e2126084fde2639514f24e6111b789b0bfa4fc6264a8975c7e1f1/zict-3.0.0-py2.py3-none-any.whl", hash = "sha256:5796e36bd0e0cc8cf0fbc1ace6a68912611c1dbd74750a3f3026b9b9d6a327ae", size = 43332, upload-time = "2023-04-17T21:41:13.444Z" },
+]
+
 [[package]]
 name = "zipp"
 version = "3.23.0"

From b4f3628d15c224755366de380daefcf449e50365 Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Wed, 17 Sep 2025 21:02:42 -0600
Subject: [PATCH 50/54] more reert

---
 .github/workflows/ci.yaml | 4 ++--
 tests/test_properties.py  | 3 +--
 2 files changed, 3 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/ci.yaml b/.github/workflows/ci.yaml
index c52145d1..d3d20fb2 100644
--- a/.github/workflows/ci.yaml
+++ b/.github/workflows/ci.yaml
@@ -71,7 +71,7 @@ jobs:
         id: status
         run: |
           uv run --no-dev python -c "import xarray; xarray.show_versions()" || true
-          uv run --no-dev pytest --durations=20 --durations-min=0.5 -n auto --cov=./ --cov-report=xml --hypothesis-profile ci tests/test_properties.py::test_groupby_reduce
+          uv run --no-dev pytest --durations=20 --durations-min=0.5 -n auto --cov=./ --cov-report=xml --hypothesis-profile ci
       - name: Upload code coverage to Codecov
         uses: codecov/codecov-action@v5.5.0
         with:
@@ -106,7 +106,7 @@ jobs:
           cache-dependency-glob: "pyproject.toml"
       - name: Install xarray and dependencies
         run: |
-          uv add --dev .[complete] pint>=0.22
+          uv add --dev ".[complete]" "pint>=0.22"
       - name: Install upstream flox
         run: |
           uv add git+https://github.com/dcherian/flox.git@${{ github.ref }}
diff --git a/tests/test_properties.py b/tests/test_properties.py
index a974f834..d243cdca 100644
--- a/tests/test_properties.py
+++ b/tests/test_properties.py
@@ -14,7 +14,7 @@
 import hypothesis.extra.numpy as npst
 import hypothesis.strategies as st
 import numpy as np
-from hypothesis import assume, given, note, reproduce_failure, settings
+from hypothesis import assume, given, note, settings
 
 import flox
 from flox.core import _is_sparse_supported_reduction, groupby_reduce, groupby_scan
@@ -88,7 +88,6 @@ def not_overflowing_array(array: np.ndarray[Any, Any]) -> bool:
     func=func_st,
 )
 @settings(deadline=None)
-@reproduce_failure("6.138.16", b"AXicc2RyZHRkYHRkAmIGRwYGEM+J/QKQAvOhkNGRA8ICMgGmLQaD")
 def test_groupby_reduce(data, array, func: str) -> None:
     # overflow behaviour differs between bincount and sum (for example)
     assume(not_overflowing_array(array))

From 28d446441dd89b2bf91a11cebe5964f12540e66e Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Wed, 17 Sep 2025 22:20:04 -0600
Subject: [PATCH 51/54] FIx overflowing check

---
 tests/test_properties.py | 13 +++++++++----
 1 file changed, 9 insertions(+), 4 deletions(-)

diff --git a/tests/test_properties.py b/tests/test_properties.py
index d243cdca..d79770d1 100644
--- a/tests/test_properties.py
+++ b/tests/test_properties.py
@@ -66,18 +66,23 @@ def bfill(array, axis, dtype=None):
 def not_overflowing_array(array: np.ndarray[Any, Any]) -> bool:
     if array.dtype.kind in "Mm":
         array = array.view(np.int64)
+    array = array.ravel()
+    array = array[notnull(array)]
+
     if array.dtype.kind == "f":
-        info = np.finfo(array.dtype)
+        info = np.finfo(array.dtype)  # type: ignore[assignment]
+        limit = 2 ** (info.nmant + 1)
     elif array.dtype.kind in ["i", "u"]:
         info = np.iinfo(array.dtype)  # type: ignore[assignment]
     else:
         return True
 
-    array = array.ravel()
-    array = array[notnull(array)]
     with warnings.catch_warnings():
         warnings.simplefilter("ignore", RuntimeWarning)
         result = bool(np.all((array < info.max / array.size) & (array > info.min / array.size)))
+        if array.dtype.kind == "f":
+            result = result and bool(np.all(np.abs(array) < limit / array.size))
+
     # note(f"returning {result}, {array.min()} vs {info.min}, {array.max()} vs {info.max}")
     return result
 
@@ -203,7 +208,7 @@ def test_groupby_reduce_numpy_vs_other(data, array, func: str) -> None:
     result_other, *_ = groupby_reduce(array, by, **kwargs)
     result_numpy, *_ = groupby_reduce(numpy_array, by, **kwargs)
     assert isinstance(result_other, type(array))
-    assert_equal(result_numpy, result_other)
+    assert_equal(result_other, result_numpy)
 
 
 @given(

From 4360f6a1dcc06356c257227b43e7b3f1aa8dae5a Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Wed, 17 Sep 2025 22:26:35 -0600
Subject: [PATCH 52/54] fi type

---
 tests/test_properties.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_properties.py b/tests/test_properties.py
index d79770d1..a8542afd 100644
--- a/tests/test_properties.py
+++ b/tests/test_properties.py
@@ -70,7 +70,7 @@ def not_overflowing_array(array: np.ndarray[Any, Any]) -> bool:
     array = array[notnull(array)]
 
     if array.dtype.kind == "f":
-        info = np.finfo(array.dtype)  # type: ignore[assignment]
+        info = np.finfo(array.dtype)
         limit = 2 ** (info.nmant + 1)
     elif array.dtype.kind in ["i", "u"]:
         info = np.iinfo(array.dtype)  # type: ignore[assignment]

From 837afe9a5bb599cad2240d4a8e305f6078a90e3a Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Wed, 17 Sep 2025 22:27:08 -0600
Subject: [PATCH 53/54] silence warning

---
 pyproject.toml | 11 -----------
 1 file changed, 11 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 887aeb7a..494dcdff 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -169,17 +169,6 @@ testpaths = ["tests"]
 ignore-words-list = "nd,nax,coo"
 skip = "*.html"
 
-[tool.uv]
-dev-dependencies = [
-    "hypothesis",
-    "pytest>=7",
-    "pytest-cov",
-    "pytest-pretty",
-    "pytest-xdist",
-    "syrupy",
-    "pooch",
-    "codecov",
-]
 
 
 

From eafb34a2fadf7350e2ca5ac218fef9c46bc5526d Mon Sep 17 00:00:00 2001
From: Deepak Cherian <deepak@cherian.net>
Date: Thu, 18 Sep 2025 08:16:45 -0600
Subject: [PATCH 54/54] Fix test

---
 flox/aggregations.py     | 29 +++++++++++++++++------------
 tests/test_properties.py |  2 ++
 2 files changed, 19 insertions(+), 12 deletions(-)

diff --git a/flox/aggregations.py b/flox/aggregations.py
index 8b53d147..d0ce8343 100644
--- a/flox/aggregations.py
+++ b/flox/aggregations.py
@@ -372,7 +372,8 @@ def var_chunk(
     )
 
     # Calculate sum squared deviations - the main part of variance sum
-    array_means = array_sums / array_lens
+    with np.errstate(invalid="ignore", divide="ignore"):
+        array_means = array_sums / array_lens
 
     sum_squared_deviations = generic_aggregate(
         group_idx,
@@ -423,15 +424,16 @@ def clip_first(array, ax, n=1):
         zero_denominator = (clip_last(cumsum_len, ax) == 0) | (clip_first(sum_len, ax) == 0)
 
         # Adjustment terms to tweak the sum of squared deviations because not every chunk has the same mean
-        adj_terms = (
-            clip_last(cumsum_len, ax) * clip_first(sum_X, ax)
-            - clip_first(sum_len, ax) * clip_last(cumsum_X, ax)
-        ) ** 2 / (
-            clip_last(cumsum_len, ax)
-            * clip_first(sum_len, ax)
-            * (clip_last(cumsum_len, ax) + clip_first(sum_len, ax))
-            + zero_denominator.astype(int)
-        )
+        with np.errstate(invalid="ignore", divide="ignore"):
+            adj_terms = (
+                clip_last(cumsum_len, ax) * clip_first(sum_X, ax)
+                - clip_first(sum_len, ax) * clip_last(cumsum_X, ax)
+            ) ** 2 / (
+                clip_last(cumsum_len, ax)
+                * clip_first(sum_len, ax)
+                * (clip_last(cumsum_len, ax) + clip_first(sum_len, ax))
+                + zero_denominator.astype(int)
+            )
 
         check = adj_terms * zero_denominator
         assert np.all(check[notnull(check)] == 0), (
@@ -456,9 +458,12 @@ def is_var_chunk_reduction(agg: Callable) -> bool:
 
 
 def _var_finalize(multiarray, ddof=0):
-    den = multiarray.arrays[2] - ddof
+    den = multiarray.arrays[2]
+    den -= ddof
     # preserve nans for groups with 0 obs; so these values are -ddof
-    ret = multiarray.arrays[0] / den
+    with np.errstate(invalid="ignore", divide="ignore"):
+        ret = multiarray.arrays[0]
+        ret /= den
     ret[den < 0] = np.nan
     return ret
 
diff --git a/tests/test_properties.py b/tests/test_properties.py
index a8542afd..86142afc 100644
--- a/tests/test_properties.py
+++ b/tests/test_properties.py
@@ -68,6 +68,8 @@ def not_overflowing_array(array: np.ndarray[Any, Any]) -> bool:
         array = array.view(np.int64)
     array = array.ravel()
     array = array[notnull(array)]
+    if array.size == 0:
+        return True
 
     if array.dtype.kind == "f":
         info = np.finfo(array.dtype)