accept both string and sequence types for reduce_ops parameter in reduce_events() (#45)

janosh · web-flow · commit 04a87534566e · 2025-06-04T08:42:49.000-04:00
- add parameterized test for str and list equivalence of reduce_ops in `test_reduce_events`
- bump pre-commit hooks
- remove duplicate typos pre-commit hook
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
@@ -8,7 +8,7 @@ default_install_hook_types: [pre-commit, commit-msg]
 
 repos:
   - repo: https://github.com/astral-sh/ruff-pre-commit
-    rev: v0.11.8
+    rev: v0.11.12
     hooks:
       - id: ruff
         args: [--fix]
@@ -48,12 +48,6 @@ repos:
       - id: nbstripout
         args: [--drop-empty-cells, --keep-output]
 
-  - repo: https://github.com/crate-ci/typos
-    rev: v1.32.0
-    hooks:
-      - id: typos
-        exclude_types: [bib]
-
   - repo: local
     hooks:
       - id: ty
diff --git a/tensorboard_reducer/reduce.py b/tensorboard_reducer/reduce.py
@@ -10,7 +10,7 @@
 
 def reduce_events(
     events_dict: dict[str, pd.DataFrame],
-    reduce_ops: Sequence[str],
+    reduce_ops: str | Sequence[str],
     *,
     verbose: bool = False,
 ) -> dict[str, dict[str, pd.DataFrame]]:
@@ -22,14 +22,19 @@ def reduce_events(
 
     Args:
         events_dict (dict[str, pd.DataFrame]): Dict of arrays to reduce.
-        reduce_ops (list[str]): Names of numpy reduce ops. E.g. mean, std, min, max, ...
+        reduce_ops (str | list[str]): Names of numpy reduce ops. E.g. mean, std, min,
+            max, ... Can be a single string or a sequence of strings.
         verbose (bool, optional): Whether to print progress. Defaults to False.
 
     Returns:
         dict[str, dict[str, pd.DataFrame]]: Dict of dicts where each subdict holds one
             reduced array for each of the specified reduce ops, e.g.
             {"loss": {"mean": arr.mean(-1), "std": arr.std(-1)}}.
     """
+    # Handle case where reduce_ops is a single string
+    if isinstance(reduce_ops, str):
+        reduce_ops = [reduce_ops]
+
     reductions: dict[str, dict[str, pd.DataFrame]] = {}
 
     for op in reduce_ops:
diff --git a/tests/test_reduce.py b/tests/test_reduce.py
@@ -15,6 +15,7 @@
 def generate_sample_data(
     n_tags: int = 1, n_runs: int = 10, n_steps: int = 5
 ) -> dict[str, pd.DataFrame]:
+    """Generate sample test data for testing reduce operations."""
     events_dict = {}
     rng = np.random.default_rng()
     for idx in range(n_tags):
@@ -32,6 +33,7 @@ def test_reduce_events(
     verbose: bool,
     capsys: pytest.CaptureFixture[str],
 ) -> None:
+    """Test reduce_events with sequence of operations."""
     reduced_events = reduce_events(events_dict, reduce_ops, verbose=verbose)
 
     out_keys = list(reduced_events)
@@ -41,17 +43,17 @@ def test_reduce_events(
     )
 
     # loop over reduce operations
-    for (op, out_dict), in_arr in zip(
-        reduced_events.items(), events_dict.values(), strict=True
-    ):
-        n_steps = len(in_arr)  # length of TB logs
+    for op in reduce_ops:
+        out_dict = reduced_events[op]
 
-        # loop over event tags (only 'strict/foo' here)
+        # loop over event tags (e.g., 'strict/foo')
         for tag, out_arr in out_dict.items():
             assert tag in events_dict, (
                 f"unexpected key {tag} in reduced event dict[{op}] = {list(out_dict)}"
             )
 
+            in_arr = events_dict[tag]
+            n_steps = len(in_arr)  # length of TB logs
             out_steps = len(out_arr)
 
             assert n_steps == out_steps, (
@@ -76,8 +78,36 @@ def test_reduce_events(
         assert stdout == ""
 
 
+@pytest.mark.parametrize("reduce_op", ["mean", "std", "max"])
+def test_reduce_events_reduce_op_str_list_equivalence(reduce_op: str) -> None:
+    """Test string input (fixes issue #44) and equivalence with list input."""
+    events_dict = generate_sample_data(n_tags=2, n_runs=3, n_steps=4)
+
+    # Test string input
+    result_string = reduce_events(events_dict, reduce_op)
+
+    # Test list input
+    result_list = reduce_events(events_dict, [reduce_op])
+
+    # Verify string input structure and correctness
+    assert len(result_string) == 1
+    assert reduce_op in result_string
+    for tag, df in events_dict.items():
+        assert tag in result_string[reduce_op]
+        expected = getattr(df, reduce_op)(axis=1)
+        pd.testing.assert_series_equal(result_string[reduce_op][tag], expected)
+
+    # Verify string and list inputs produce identical results
+    assert result_string.keys() == result_list.keys()
+    for tag in events_dict:
+        pd.testing.assert_series_equal(
+            result_string[reduce_op][tag], result_list[reduce_op][tag]
+        )
+
+
 @pytest.mark.parametrize("n_tags, n_runs, n_steps", [(1, 10, 5), (2, 5, 3), (3, 3, 10)])
 def test_reduce_events_dimensions(n_tags: int, n_runs: int, n_steps: int) -> None:
+    """Test reduce_events with different data dimensions."""
     events_dict = generate_sample_data(n_tags=n_tags, n_runs=n_runs, n_steps=n_steps)
     reduce_ops = ["mean", "std", "max", "min"]
     reduced_events = reduce_events(events_dict, reduce_ops)
@@ -97,5 +127,6 @@ def test_reduce_events_dimensions(n_tags: int, n_runs: int, n_steps: int) -> Non
 
 @pytest.mark.parametrize("reduce_ops", [["mean"], ["max", "min"], ["std", "median"]])
 def test_reduce_events_empty_input(reduce_ops: Sequence[str]) -> None:
+    """Test reduce_events with empty input dictionary."""
     reduced_events = reduce_events({}, reduce_ops)
     assert reduced_events == {op: {} for op in reduce_ops}