feat: pyarrow Series.sum (#495)

* Feat: Series.sum test case
* [pre-commit.ci] auto fixes from pre-commit.com hooks
  for more information, see https://pre-commit.ci
* test_series_sum refactoring
* [pre-commit.ci] auto fixes from pre-commit.com hooks
  for more information, see https://pre-commit.ci
* fixing according to standard
* [pre-commit.ci] auto fixes from pre-commit.com hooks
  for more information, see https://pre-commit.ci
* refactoring code to satisfy code criteria
* Fixing Series.sum functionality for Pyarrow DF
* [pre-commit.ci] auto fixes from pre-commit.com hooks
  for more information, see https://pre-commit.ci
* Fixing compare mistake on Series.sum for Pyarrow
* cleaning up code
* removing 'pyarrow_table' from test_sum_all and test_renamed_taxicab
* [pre-commit.ci] auto fixes from pre-commit.com hooks
  for more information, see https://pre-commit.ci
* making sure CI passes all test cases
* all test cases passed on CI

---------

Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
narwhals-dev · Jul 15, 2024 · 2bc3a6f
1 parent 721816f
commit 2bc3a6f
Show file tree

Hide file tree

Showing 6 changed files with 32 additions and 11 deletions.
diff --git a/narwhals/_arrow/expr.py b/narwhals/_arrow/expr.py
@@ -165,6 +165,9 @@ def max(self) -> Self:
     def all(self) -> Self:
         return reuse_series_implementation(self, "all", returns_scalar=True)
 
+    def sum(self) -> Self:
+        return reuse_series_implementation(self, "sum", returns_scalar=True)
+
     def alias(self, name: str) -> Self:
         # Define this one manually, so that we can
         # override `output_names` and not increase depth

diff --git a/narwhals/_arrow/series.py b/narwhals/_arrow/series.py
@@ -155,6 +155,10 @@ def max(self) -> int:
         pc = get_pyarrow_compute()
         return pc.max(self._native_series)  # type: ignore[no-any-return]
 
+    def sum(self) -> int:
+        pc = get_pyarrow_compute()
+        return pc.sum(self._native_series)  # type: ignore[no-any-return]
+
     def std(self, ddof: int = 1) -> int:
         pc = get_pyarrow_compute()
         return pc.stddev(self._native_series, ddof=ddof)  # type: ignore[no-any-return]

diff --git a/tests/expr/sum_all_test.py b/tests/expr/sum_all_test.py
@@ -1,15 +1,10 @@
 from typing import Any
 
-import pytest
-
 import narwhals.stable.v1 as nw
 from tests.utils import compare_dicts
 
 
-def test_sum_all(request: Any, constructor: Any) -> None:
-    if "pyarrow_table" in str(constructor):
-        request.applymarker(pytest.mark.xfail)
-
+def test_sum_all(constructor: Any) -> None:
     data = {"a": [1, 3, 2], "b": [4, 4, 6], "z": [7.0, 8, 9]}
     df = nw.from_native(constructor(data), eager_only=True)
     result = df.select(nw.all().sum())

diff --git a/tests/frame/series_sum_test.py b/tests/frame/series_sum_test.py
@@ -0,0 +1,23 @@
+from __future__ import annotations
+
+from typing import Any
+
+import narwhals.stable.v1 as nw
+from tests.utils import compare_dicts
+
+
+def test_series_sum(constructor: Any) -> None:
+    data = {
+        "a": [0, 1, 2, 3, 4],
+        "b": [1, 2, 3, 5, 3],
+        "c": [5, 4, None, 2, 1],
+    }
+    df = nw.from_native(
+        constructor(data), strict=False, eager_only=True, allow_series=True
+    )
+
+    result = df.select(nw.col("a", "b", "c").sum())
+
+    expected_sum = {"a": [10], "b": [14], "c": [12]}
+
+    compare_dicts(result, expected_sum)
diff --git a/tests/stable_api_test.py b/tests/stable_api_test.py
@@ -8,7 +8,7 @@
 from tests.utils import compare_dicts
 
 
-def test_renamed_taxicab_norm(request: Any, constructor: Any) -> None:
+def test_renamed_taxicab_norm(constructor: Any) -> None:
     # Suppose we need to rename `_l1_norm` to `_taxicab_norm`.
     # We need `narwhals.stable.v1` to stay stable. So, we
     # make the change in `narwhals`, and then add the new method
@@ -17,9 +17,6 @@ def test_renamed_taxicab_norm(request: Any, constructor: Any) -> None:
     # API will still be able to use it, without the main namespace
     # getting cluttered by the new name.
 
-    if "pyarrow_table" in str(constructor):
-        request.applymarker(pytest.mark.xfail)
-
     df = nw.from_native(constructor({"a": [1, 2, 3, -4, 5]}))
     result = df.with_columns(b=nw.col("a")._taxicab_norm())
     expected = {"a": [1, 2, 3, -4, 5], "b": [15] * 5}

diff --git a/utils/check_backend_completeness.py b/utils/check_backend_completeness.py
@@ -35,7 +35,6 @@
     "Series.sample",
     "Series.shift",
     "Series.sort",
-    "Series.sum",
     "Series.to_frame",
     "Series.to_pandas",
     "Series.unique",