From 49af95b65241a5bdfaba79fe36f17a40c9c72acd Mon Sep 17 00:00:00 2001
From: CREDO23 <bakerathierry@gmail.com>
Date: Thu, 28 May 2026 19:03:08 +0200
Subject: [PATCH] test(automations/runtime): lock execute_step + with_retries
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

execute_step (6 tests): happy path, when=falsy → skipped, unknown action
→ ActionNotFound failure, retry budget exhaustion (attempts = 1 +
max_retries), retry recovery, and template-rendering of step params
against the run context.

with_retries (3 tests): first-try success returns attempts=1, recovery
returns the actual attempt that produced the result, and exhaustion
re-raises the last exception with the handler called 1 + max_retries
times.

All tests use backoff="none" to keep wall-clock time zero. Timeout
testing is intentionally skipped: it would need >= 1s per the int contract,
and the exhaustion tests already lock that any Exception triggers a retry.
---
 .../unit/automations/runtime/__init__.py      |   0
 .../automations/runtime/test_execute_step.py  | 272 ++++++++++++++++++
 .../unit/automations/runtime/test_retries.py  |  72 +++++
 3 files changed, 344 insertions(+)
 create mode 100644 surfsense_backend/tests/unit/automations/runtime/__init__.py
 create mode 100644 surfsense_backend/tests/unit/automations/runtime/test_execute_step.py
 create mode 100644 surfsense_backend/tests/unit/automations/runtime/test_retries.py

diff --git a/surfsense_backend/tests/unit/automations/runtime/__init__.py b/surfsense_backend/tests/unit/automations/runtime/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/surfsense_backend/tests/unit/automations/runtime/test_execute_step.py b/surfsense_backend/tests/unit/automations/runtime/test_execute_step.py
new file mode 100644
index 000000000..9b203fdba
--- /dev/null
+++ b/surfsense_backend/tests/unit/automations/runtime/test_execute_step.py
@@ -0,0 +1,272 @@
+"""Lock the ``execute_step`` orchestration contract.
+
+Covers the pure step-execution logic: predicate gate, params rendering,
+action lookup, retry budget, error shaping. The ``ActionContext.session``
+is never touched by ``execute_step`` itself (it's only forwarded to the
+handler), so unit tests pass ``None`` cast to the type.
+"""
+
+from __future__ import annotations
+
+from typing import Any, cast
+
+import pytest
+from pydantic import BaseModel
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.automations.actions.store import register_action
+from app.automations.actions.types import ActionContext, ActionDefinition
+from app.automations.runtime.step import execute_step
+from app.automations.schemas.definition.plan_step import PlanStep
+
+pytestmark = pytest.mark.unit
+
+
+class _AnyParams(BaseModel):
+    """Open params model for test actions: declares no fields, allows any extras."""
+
+    model_config = {"extra": "allow"}
+
+
+def _action_context() -> ActionContext:
+    """Minimal context: session is unused by ``execute_step``, only forwarded."""
+    return ActionContext(
+        session=cast(AsyncSession, None),
+        run_id=1,
+        step_id="s1",
+        search_space_id=1,
+        creator_user_id=None,
+    )
+
+
+async def test_execute_step_runs_registered_action_handler_and_wraps_result(
+    isolated_action_registry: None,
+) -> None:
+    """A step pointing at a registered action runs its handler with the
+    step's params and returns a ``succeeded`` entry carrying the handler's
+    output plus ``attempts=1`` (one try, no retries triggered)."""
+    invocations: list[dict[str, Any]] = []
+
+    async def echo(params: dict[str, Any]) -> dict[str, Any]:
+        invocations.append(params)
+        return {"echoed": params["value"]}
+
+    register_action(
+        ActionDefinition(
+            type="test_echo",
+            name="Echo",
+            description="Test action.",
+            params_model=_AnyParams,
+            build_handler=lambda _ctx: echo,
+        )
+    )
+
+    step = PlanStep(step_id="s1", action="test_echo", params={"value": "hello"})
+
+    result = await execute_step(
+        step=step,
+        template_context={},
+        action_context=_action_context(),
+        default_max_retries=0,
+        default_retry_backoff="none",
+        default_timeout_seconds=30,
+    )
+
+    assert result["status"] == "succeeded"
+    assert result["step_id"] == "s1"
+    assert result["action"] == "test_echo"
+    assert result["attempts"] == 1
+    assert result["result"] == {"echoed": "hello"}
+    assert invocations == [{"value": "hello"}]
+
+
+async def test_execute_step_skips_step_when_predicate_is_falsy(
+    isolated_action_registry: None,
+) -> None:
+    """If ``step.when`` evaluates to falsy in the template context, the
+    handler is **not** invoked, the result entry has ``status=skipped``
+    and ``attempts=0``, and no ``result`` key is present."""
+    invoked = False
+
+    async def must_not_run(_params: dict[str, Any]) -> dict[str, Any]:
+        nonlocal invoked
+        invoked = True
+        return {}
+
+    register_action(
+        ActionDefinition(
+            type="test_guarded",
+            name="Guarded",
+            description="Test action that should not run.",
+            params_model=_AnyParams,
+            build_handler=lambda _ctx: must_not_run,
+        )
+    )
+
+    step = PlanStep(
+        step_id="s1",
+        action="test_guarded",
+        when="inputs.enabled",
+        params={},
+    )
+
+    result = await execute_step(
+        step=step,
+        template_context={"inputs": {"enabled": False}},
+        action_context=_action_context(),
+        default_max_retries=0,
+        default_retry_backoff="none",
+        default_timeout_seconds=30,
+    )
+
+    assert result["status"] == "skipped"
+    assert result["attempts"] == 0
+    assert "result" not in result
+    assert invoked is False
+
+
+async def test_execute_step_fails_when_step_references_an_unknown_action(
+    isolated_action_registry: None,
+) -> None:
+    """A step pointing at an action that isn't in the registry must fail
+    with ``ActionNotFound`` rather than crashing. Catches typos in the
+    plan and removed actions without the run going off the rails."""
+    step = PlanStep(step_id="s1", action="no_such_action", params={})
+
+    result = await execute_step(
+        step=step,
+        template_context={},
+        action_context=_action_context(),
+        default_max_retries=0,
+        default_retry_backoff="none",
+        default_timeout_seconds=30,
+    )
+
+    assert result["status"] == "failed"
+    assert result["attempts"] == 0
+    assert result["error"]["type"] == "ActionNotFound"
+    assert "no_such_action" in result["error"]["message"]
+
+
+async def test_execute_step_retries_failing_handler_up_to_default_budget(
+    isolated_action_registry: None,
+) -> None:
+    """A handler that raises on every attempt consumes the retry budget
+    (1 initial try + ``default_max_retries`` retries) and the step ends
+    ``failed`` with the exception's type and message surfaced through
+    the error envelope."""
+    calls = 0
+
+    async def always_fails(_params: dict[str, Any]) -> dict[str, Any]:
+        nonlocal calls
+        calls += 1
+        raise RuntimeError("boom")
+
+    register_action(
+        ActionDefinition(
+            type="test_fails",
+            name="Fails",
+            description="Always raises.",
+            params_model=_AnyParams,
+            build_handler=lambda _ctx: always_fails,
+        )
+    )
+
+    step = PlanStep(step_id="s1", action="test_fails", params={})
+
+    result = await execute_step(
+        step=step,
+        template_context={},
+        action_context=_action_context(),
+        default_max_retries=2,
+        default_retry_backoff="none",
+        default_timeout_seconds=30,
+    )
+
+    assert result["status"] == "failed"
+    assert result["attempts"] == 3
+    assert calls == 3
+    assert result["error"]["type"] == "RuntimeError"
+    assert "boom" in result["error"]["message"]
+
+
+async def test_execute_step_succeeds_when_handler_recovers_within_retry_budget(
+    isolated_action_registry: None,
+) -> None:
+    """A handler that fails the first N times and then succeeds yields a
+    ``succeeded`` entry with ``attempts == N + 1``. Locks that retries
+    can actually recover (not just exhaust)."""
+    calls = 0
+
+    async def flaky(_params: dict[str, Any]) -> dict[str, Any]:
+        nonlocal calls
+        calls += 1
+        if calls < 3:
+            raise RuntimeError("transient")
+        return {"ok": True}
+
+    register_action(
+        ActionDefinition(
+            type="test_flaky",
+            name="Flaky",
+            description="Fails twice, succeeds third time.",
+            params_model=_AnyParams,
+            build_handler=lambda _ctx: flaky,
+        )
+    )
+
+    step = PlanStep(step_id="s1", action="test_flaky", params={})
+
+    result = await execute_step(
+        step=step,
+        template_context={},
+        action_context=_action_context(),
+        default_max_retries=2,
+        default_retry_backoff="none",
+        default_timeout_seconds=30,
+    )
+
+    assert result["status"] == "succeeded"
+    assert result["attempts"] == 3
+    assert result["result"] == {"ok": True}
+    assert calls == 3
+
+
+async def test_execute_step_renders_step_params_through_template_engine(
+    isolated_action_registry: None,
+) -> None:
+    """Step params are rendered against the template context before the
+    handler is invoked. String values containing Jinja expressions get
+    substituted from the run context (this test exercises ``inputs``)."""
+    received: list[dict[str, Any]] = []
+
+    async def capture(params: dict[str, Any]) -> dict[str, Any]:
+        received.append(params)
+        return {}
+
+    register_action(
+        ActionDefinition(
+            type="test_capture",
+            name="Capture",
+            description="Captures the params passed in.",
+            params_model=_AnyParams,
+            build_handler=lambda _ctx: capture,
+        )
+    )
+
+    step = PlanStep(
+        step_id="s1",
+        action="test_capture",
+        params={"message": "Hello {{ inputs.name }}"},
+    )
+
+    await execute_step(
+        step=step,
+        template_context={"inputs": {"name": "World"}, "steps": {}},
+        action_context=_action_context(),
+        default_max_retries=0,
+        default_retry_backoff="none",
+        default_timeout_seconds=30,
+    )
+
+    assert received == [{"message": "Hello World"}]
diff --git a/surfsense_backend/tests/unit/automations/runtime/test_retries.py b/surfsense_backend/tests/unit/automations/runtime/test_retries.py
new file mode 100644
index 000000000..f0f12ca59
--- /dev/null
+++ b/surfsense_backend/tests/unit/automations/runtime/test_retries.py
@@ -0,0 +1,72 @@
+"""Lock the ``with_retries`` policy: budget, recovery, exhaustion.
+
+Every test uses ``backoff="none"`` and ``timeout=None`` so wall-clock time
+stays at zero. Timeout handling and backoff sleep durations are not covered
+here; add dedicated tests if those behaviours need to be locked.
+"""
+
+from __future__ import annotations
+
+import pytest
+
+from app.automations.runtime.retries import with_retries
+
+pytestmark = pytest.mark.unit
+
+
+async def test_with_retries_returns_result_and_attempts_one_on_first_success() -> None:
+    """A coroutine that succeeds on the first call returns its result
+    paired with ``attempts=1`` — no retry consumed."""
+    calls = 0
+
+    async def succeed() -> str:
+        nonlocal calls
+        calls += 1
+        return "ok"
+
+    result, attempts = await with_retries(
+        succeed, max_retries=2, backoff="none", timeout=None
+    )
+
+    assert result == "ok"
+    assert attempts == 1
+    assert calls == 1
+
+
+async def test_with_retries_returns_attempt_count_when_succeeding_after_failures() -> None:
+    """A coroutine that fails twice then succeeds returns ``attempts=3``
+    (the actual attempt that produced the result). Locks the contract
+    that the caller can distinguish first-try success from a recovery."""
+    calls = 0
+
+    async def flaky() -> str:
+        nonlocal calls
+        calls += 1
+        if calls < 3:
+            raise RuntimeError("transient")
+        return "ok"
+
+    result, attempts = await with_retries(
+        flaky, max_retries=5, backoff="none", timeout=None
+    )
+
+    assert result == "ok"
+    assert attempts == 3
+    assert calls == 3
+
+
+async def test_with_retries_reraises_after_exhausting_the_budget() -> None:
+    """When the coroutine raises on every attempt within
+    ``1 + max_retries`` tries, the last exception propagates and the
+    handler is called exactly ``1 + max_retries`` times."""
+    calls = 0
+
+    async def always_fails() -> str:
+        nonlocal calls
+        calls += 1
+        raise RuntimeError(f"boom-{calls}")
+
+    with pytest.raises(RuntimeError, match="boom-3"):
+        await with_retries(always_fails, max_retries=2, backoff="none", timeout=None)
+
+    assert calls == 3  # 1 initial + 2 retries