ml31415
diff --git a/conftest.py b/conftest.py
Lines changed: 3 additions & 1 deletion
diff --git a/numpy_groupies/aggregate_numba.py b/numpy_groupies/aggregate_numba.py
Lines changed: 26 additions & 7 deletions
diff --git a/numpy_groupies/aggregate_numpy.py b/numpy_groupies/aggregate_numpy.py
Lines changed: 43 additions & 11 deletions
diff --git a/numpy_groupies/aggregate_numpy_ufunc.py b/numpy_groupies/aggregate_numpy_ufunc.py
Lines changed: 11 additions & 1 deletion
diff --git a/numpy_groupies/aggregate_pandas.py b/numpy_groupies/aggregate_pandas.py
Lines changed: 15 additions & 3 deletions
diff --git a/numpy_groupies/aggregate_purepy.py b/numpy_groupies/aggregate_purepy.py
Lines changed: 34 additions & 8 deletions
@@ -5,7 +5,9 @@
 
 
 def pytest_configure(config):
-    config.addinivalue_line("markers", "deselect_if(func): function to deselect tests from parametrization")
+    config.addinivalue_line(
+        "markers", "deselect_if(func): function to deselect tests from parametrization"
+    )
 
 
 def pytest_collection_modifyitems(config, items):
 
@@ -68,7 +68,9 @@ def __call__(
         dtype = check_dtype(dtype, self.func, a, len(group_idx))
         check_fill_value(fill_value, dtype, func=self.func)
         input_dtype = type(a) if np.isscalar(a) else a.dtype
-        ret, counter, mean, outer = self._initialize(flat_size, fill_value, dtype, input_dtype, group_idx.size)
+        ret, counter, mean, outer = self._initialize(
+            flat_size, fill_value, dtype, input_dtype, group_idx.size
+        )
         group_idx = np.ascontiguousarray(group_idx)
 
         if not np.isscalar(a):
@@ -141,7 +143,9 @@ def inner(ri, val, ret, counter, mean, fill_value):
         def loop(group_idx, a, ret, counter, mean, outer, fill_value, ddof):
             # ddof needs to be present for being exchangeable with loop_2pass
             size = len(ret)
-            rng = range(len(group_idx) - 1, -1, -1) if reverse else range(len(group_idx))
+            rng = (
+                range(len(group_idx) - 1, -1, -1) if reverse else range(len(group_idx))
+            )
             for i in rng:
                 ri = group_idx[i]
                 if ri < 0:
@@ -242,14 +246,18 @@ def __call__(
         axis=None,
         ddof=0,
     ):
-        iv = input_validation(group_idx, a, size=size, order=order, axis=axis, check_bounds=False)
+        iv = input_validation(
+            group_idx, a, size=size, order=order, axis=axis, check_bounds=False
+        )
         group_idx, a, flat_size, ndim_idx, size, _ = iv
 
         # TODO: The typecheck should be done by the class itself, not by check_dtype
         dtype = check_dtype(dtype, self.func, a, len(group_idx))
         check_fill_value(fill_value, dtype, func=self.func)
         input_dtype = type(a) if np.isscalar(a) else a.dtype
-        ret, _, _, _ = self._initialize(flat_size, fill_value, dtype, input_dtype, group_idx.size)
+        ret, _, _, _ = self._initialize(
+            flat_size, fill_value, dtype, input_dtype, group_idx.size
+        )
         group_idx = np.ascontiguousarray(group_idx)
 
         sortidx = np.argsort(group_idx, kind="mergesort")
@@ -493,7 +501,7 @@ class CumMin(AggregateNtoN, Min):
 
 
 def get_funcs():
-    funcs = dict()
+    funcs = {}
     for op in (
         Sum,
         Prod,
@@ -530,7 +538,16 @@ def get_funcs():
 
 
 def aggregate(
-    group_idx, a, func="sum", size=None, fill_value=0, order="C", dtype=None, axis=None, cache=True, **kwargs
+    group_idx,
+    a,
+    func="sum",
+    size=None,
+    fill_value=0,
+    order="C",
+    dtype=None,
+    axis=None,
+    cache=True,
+    **kwargs,
 ):
     func = get_func(func, aliasing, _impl_dict)
     if not isinstance(func, str):
@@ -541,7 +558,9 @@ def aggregate(
             if cache is True:
                 cache = _default_cache
             aggregate_op = cache.setdefault(func, AggregateGeneric(func))
-        return aggregate_op(group_idx, a, size, fill_value, order, dtype, axis, **kwargs)
+        return aggregate_op(
+            group_idx, a, size, fill_value, order, dtype, axis, **kwargs
+        )
     else:
         func = _impl_dict[func]
         return func(group_idx, a, size, fill_value, order, dtype, axis, **kwargs)
 
@@ -30,7 +30,9 @@ def _sum(group_idx, a, size, fill_value, dtype=None):
             ret.real = np.bincount(group_idx, weights=a.real, minlength=size)
             ret.imag = np.bincount(group_idx, weights=a.imag, minlength=size)
         else:
-            ret = np.bincount(group_idx, weights=a, minlength=size).astype(dtype, copy=False)
+            ret = np.bincount(group_idx, weights=a, minlength=size).astype(
+                dtype, copy=False
+            )
 
     if fill_value != 0:
         _fill_untouched(group_idx, ret, fill_value)
@@ -117,7 +119,9 @@ def _argmax(group_idx, a, size, fill_value, dtype=int, _nansqueeze=False):
     ret = np.full(size, fill_value, dtype=dtype)
     group_idx_max = group_idx[is_max]
     (argmax,) = is_max.nonzero()
-    ret[group_idx_max[::-1]] = argmax[::-1]  # reverse to ensure first value for each group wins
+    ret[group_idx_max[::-1]] = argmax[
+        ::-1
+    ]  # reverse to ensure first value for each group wins
     return ret
 
 
@@ -129,7 +133,9 @@ def _argmin(group_idx, a, size, fill_value, dtype=int, _nansqueeze=False):
     ret = np.full(size, fill_value, dtype=dtype)
     group_idx_min = group_idx[is_min]
     (argmin,) = is_min.nonzero()
-    ret[group_idx_min[::-1]] = argmin[::-1]  # reverse to ensure first value for each group wins
+    ret[group_idx_min[::-1]] = argmin[
+        ::-1
+    ]  # reverse to ensure first value for each group wins
     return ret
 
 
@@ -143,7 +149,9 @@ def _mean(group_idx, a, size, fill_value, dtype=np.dtype(np.float64)):
         sums.real = np.bincount(group_idx, weights=a.real, minlength=size)
         sums.imag = np.bincount(group_idx, weights=a.imag, minlength=size)
     else:
-        sums = np.bincount(group_idx, weights=a, minlength=size).astype(dtype, copy=False)
+        sums = np.bincount(group_idx, weights=a, minlength=size).astype(
+            dtype, copy=False
+        )
 
     with np.errstate(divide="ignore", invalid="ignore"):
         ret = sums.astype(dtype, copy=False) / counts
@@ -160,15 +168,19 @@ def _sum_of_squres(group_idx, a, size, fill_value, dtype=np.dtype(np.float64)):
     return ret
 
 
-def _var(group_idx, a, size, fill_value, dtype=np.dtype(np.float64), sqrt=False, ddof=0):
+def _var(
+    group_idx, a, size, fill_value, dtype=np.dtype(np.float64), sqrt=False, ddof=0
+):
     if np.ndim(a) == 0:
         raise ValueError("cannot take variance with scalar a")
     counts = np.bincount(group_idx, minlength=size)
     sums = np.bincount(group_idx, weights=a, minlength=size)
     with np.errstate(divide="ignore", invalid="ignore"):
         means = sums.astype(dtype, copy=False) / counts
         counts = np.where(counts > ddof, counts - ddof, 0)
-        ret = np.bincount(group_idx, (a - means[group_idx]) ** 2, minlength=size) / counts
+        ret = (
+            np.bincount(group_idx, (a - means[group_idx]) ** 2, minlength=size) / counts
+        )
     if sqrt:
         ret = np.sqrt(ret)  # this is now std not var
     if not np.isnan(fill_value):
@@ -208,7 +220,9 @@ def _array(group_idx, a, size, fill_value, dtype=None):
     return ret
 
 
-def _generic_callable(group_idx, a, size, fill_value, dtype=None, func=lambda g: g, **kwargs):
+def _generic_callable(
+    group_idx, a, size, fill_value, dtype=None, func=lambda g: g, **kwargs
+):
     """groups a by inds, and then applies foo to each group in turn, placing
     the results in an array."""
     groups = _array(group_idx, a, size, ())
@@ -244,7 +258,9 @@ def _cumsum(group_idx, a, size, fill_value=None, dtype=None):
 
 def _nancumsum(group_idx, a, size, fill_value=None, dtype=None):
     a_nonans = np.where(np.isnan(a), 0, a)
-    group_idx_nonans = np.where(np.isnan(group_idx), np.nanmax(group_idx) + 1, group_idx)
+    group_idx_nonans = np.where(
+        np.isnan(group_idx), np.nanmax(group_idx) + 1, group_idx
+    )
     return _cumsum(group_idx_nonans, a_nonans, size, fill_value=fill_value, dtype=dtype)
 
 
@@ -271,7 +287,11 @@ def _nancumsum(group_idx, a, size, fill_value=None, dtype=None):
     sumofsquares=_sum_of_squres,
     generic=_generic_callable,
 )
-_impl_dict.update(("nan" + k, v) for k, v in list(_impl_dict.items()) if k not in funcs_no_separate_nan)
+_impl_dict.update(
+    ("nan" + k, v)
+    for k, v in list(_impl_dict.items())
+    if k not in funcs_no_separate_nan
+)
 _impl_dict["nancumsum"] = _nancumsum
 
 
@@ -321,7 +341,9 @@ def _aggregate_base(
         dtype = check_dtype(dtype, func, a, flat_size)
         check_fill_value(fill_value, dtype, func=func)
         func = _impl_dict[func]
-        ret = func(group_idx, a, flat_size, fill_value=fill_value, dtype=dtype, **kwargs)
+        ret = func(
+            group_idx, a, flat_size, fill_value=fill_value, dtype=dtype, **kwargs
+        )
 
     # deal with ndimensional indexing
     if ndim_idx > 1:
@@ -335,7 +357,17 @@ def _aggregate_base(
     return ret
 
 
-def aggregate(group_idx, a, func="sum", size=None, fill_value=0, order="C", dtype=None, axis=None, **kwargs):
+def aggregate(
+    group_idx,
+    a,
+    func="sum",
+    size=None,
+    fill_value=0,
+    order="C",
+    dtype=None,
+    axis=None,
+    **kwargs,
+):
     return _aggregate_base(
         group_idx,
         a,
 
@@ -97,7 +97,17 @@ def _max(group_idx, a, size, fill_value, dtype=None):
 )
 
 
-def aggregate(group_idx, a, func="sum", size=None, fill_value=0, order="C", dtype=None, axis=None, **kwargs):
+def aggregate(
+    group_idx,
+    a,
+    func="sum",
+    size=None,
+    fill_value=0,
+    order="C",
+    dtype=None,
+    axis=None,
+    **kwargs,
+):
     func = get_func(func, aliasing, _impl_dict)
     if not isinstance(func, str):
         raise NotImplementedError("No such ufunc available")
 
@@ -15,7 +15,7 @@
 
 def _wrapper(group_idx, a, size, fill_value, func="sum", dtype=None, ddof=0, **kwargs):
     funcname = func.__name__ if callable(func) else func
-    kwargs = dict()
+    kwargs = {}
     if funcname in ("var", "std"):
         kwargs["ddof"] = ddof
     df = pd.DataFrame({"group_idx": group_idx, "a": a})
@@ -37,7 +37,9 @@ def _wrapper(group_idx, a, size, fill_value, func="sum", dtype=None, ddof=0, **k
 _supported_funcs = "sum prod all any min max mean var std first last cumsum cumprod cummax cummin".split()
 _impl_dict = {fn: partial(_wrapper, func=fn) for fn in _supported_funcs}
 _impl_dict.update(
-    ("nan" + fn, partial(_wrapper, func=fn)) for fn in _supported_funcs if fn not in funcs_no_separate_nan
+    ("nan" + fn, partial(_wrapper, func=fn))
+    for fn in _supported_funcs
+    if fn not in funcs_no_separate_nan
 )
 _impl_dict.update(
     allnan=partial(_wrapper, func=allnan),
@@ -52,7 +54,17 @@ def _wrapper(group_idx, a, size, fill_value, func="sum", dtype=None, ddof=0, **k
 )
 
 
-def aggregate(group_idx, a, func="sum", size=None, fill_value=0, order="C", dtype=None, axis=None, **kwargs):
+def aggregate(
+    group_idx,
+    a,
+    func="sum",
+    size=None,
+    fill_value=0,
+    order="C",
+    dtype=None,
+    axis=None,
+    **kwargs,
+):
     return _aggregate_base(
         group_idx,
         a,
 
@@ -67,7 +67,9 @@ def _sort(group_idx, a, reverse=False):
     def _argsort(unordered):
         return sorted(range(len(unordered)), key=lambda k: unordered[k])
 
-    sortidx = _argsort(list((gi, aj) for gi, aj in zip(group_idx, -a if reverse else a)))
+    sortidx = _argsort(
+        list((gi, aj) for gi, aj in zip(group_idx, -a if reverse else a))
+    )
     revidx = _argsort(_argsort(group_idx))
     a_srt = [a[si] for si in sortidx]
     return [a_srt[ri] for ri in revidx]
@@ -93,10 +95,24 @@ def _argsort(unordered):
     argmin=_argmin,
     len=len,
 )
-_impl_dict.update(("nan" + k, v) for k, v in list(_impl_dict.items()) if k not in funcs_no_separate_nan)
+_impl_dict.update(
+    ("nan" + k, v)
+    for k, v in list(_impl_dict.items())
+    if k not in funcs_no_separate_nan
+)
 
 
-def aggregate(group_idx, a, func="sum", size=None, fill_value=0, order=None, dtype=None, axis=None, **kwargs):
+def aggregate(
+    group_idx,
+    a,
+    func="sum",
+    size=None,
+    fill_value=0,
+    order=None,
+    dtype=None,
+    axis=None,
+    **kwargs,
+):
     if axis is not None:
         raise NotImplementedError("axis arg not supported in purepy implementation.")
 
@@ -105,29 +121,37 @@ def aggregate(group_idx, a, func="sum", size=None, fill_value=0, order=None, dty
         try:
             size = 1 + int(max(group_idx))
         except (TypeError, ValueError):
-            raise NotImplementedError("pure python implementation doesn't accept ndim idx input.")
+            raise NotImplementedError(
+                "pure python implementation doesn't accept ndim idx input."
+            )
 
     for i in group_idx:
         try:
             i = int(i)
         except (TypeError, ValueError):
             if isinstance(i, (list, tuple)):
-                raise NotImplementedError("pure python implementation doesn't accept ndim idx input.")
+                raise NotImplementedError(
+                    "pure python implementation doesn't accept ndim idx input."
+                )
             else:
                 try:
                     len(i)
                 except TypeError:
                     raise ValueError(f"invalid value found in group_idx: {i}")
                 else:
-                    raise NotImplementedError("pure python implementation doesn't accept ndim indexed input.")
+                    raise NotImplementedError(
+                        "pure python implementation doesn't accept ndim indexed input."
+                    )
         else:
             if i < 0:
                 raise ValueError("group_idx contains negative value")
 
     func = get_func(func, aliasing, _impl_dict)
     if isinstance(a, (int, float)):
         if func not in ("sum", "prod", "len"):
-            raise ValueError("scalar inputs are supported only for 'sum', 'prod' and 'len'")
+            raise ValueError(
+                "scalar inputs are supported only for 'sum', 'prod' and 'len'"
+            )
         a = [a] * len(group_idx)
     elif len(group_idx) != len(a):
         raise ValueError("group_idx and a must be of the same length")
@@ -136,7 +160,9 @@ def aggregate(group_idx, a, func="sum", size=None, fill_value=0, order=None, dty
         if func.startswith("nan"):
             func = func[3:]
             # remove nans
-            group_idx, a = zip(*((ix, val) for ix, val in zip(group_idx, a) if not math.isnan(val)))
+            group_idx, a = zip(
+                *((ix, val) for ix, val in zip(group_idx, a) if not math.isnan(val))
+            )
 
         func = _impl_dict[func]
     if func is _sort: