Initial release: iai-mcp v0.1.0

Co-Authored-By: Claude <noreply@anthropic.com> Co-Authored-By: XNLLLLH <XNLLLLH@users.noreply.github.com>
2026-05-06 01:04:47 -07:00 · 2026-05-06 01:04:47 -07:00 · f6b876fbe7
commit f6b876fbe7
332 changed files with 97258 additions and 0 deletions
--- a/tests/test_batch_api.py
+++ b/tests/test_batch_api.py
@ -0,0 +1,120 @@
+"""Tests for TOK-09 Batch API consolidation (Plan 02-04 Task 3, D-29).
+
+submit_batch_consolidation passes through D-GUARD (should_call_llm) before
+any network work. On Tier 0 fallback (no llm_enabled, no api key, budget
+exceeded, ratelimit cooldown) returns stub results + writes llm_health
+event. scope: the gate + event side-effects are load-bearing;
+the real anthropic.batches.create call is stubbed (SDK surface varies).
+"""
+from __future__ import annotations
+
+import pytest
+
+from iai_mcp.events import query_events
+from iai_mcp.guard import BudgetLedger, RateLimitLedger
+from iai_mcp.store import MemoryStore
+
+
+def _tasks(n: int = 3) -> list[dict]:
+    return [
+        {
+            "task_id": f"t{i}",
+            "prompt": f"summarise cluster {i}",
+            "prompt_tok": 500,
+            "output_tok": 200,
+        }
+        for i in range(n)
+    ]
+
+
+def test_batch_fallback_when_llm_disabled(tmp_path):
+    from iai_mcp.batch import submit_batch_consolidation
+
+    store = MemoryStore(path=tmp_path)
+    budget = BudgetLedger(store)
+    rate = RateLimitLedger(store)
+    ok, reason, results = submit_batch_consolidation(
+        store, _tasks(), budget, rate, llm_enabled=False,
+    )
+    assert ok is False
+    assert "llm_enabled" in reason.lower() or "disabled" in reason.lower()
+    # Fallback returns an empty-but-structured list so downstream consumers
+    # don't crash on a None.
+    assert isinstance(results, list)
+
+
+def test_batch_fallback_when_no_api_key(tmp_path, monkeypatch):
+    from iai_mcp.batch import submit_batch_consolidation
+
+    monkeypatch.delenv("ANTHROPIC_API_KEY", raising=False)
+    store = MemoryStore(path=tmp_path)
+    budget = BudgetLedger(store)
+    rate = RateLimitLedger(store)
+    ok, reason, _ = submit_batch_consolidation(
+        store, _tasks(), budget, rate, llm_enabled=True,
+    )
+    assert ok is False
+    # D-GUARD step 2.
+    assert "api" in reason.lower() or "key" in reason.lower()
+
+
+def test_batch_emits_llm_health_on_fallback(tmp_path):
+    from iai_mcp.batch import submit_batch_consolidation
+
+    store = MemoryStore(path=tmp_path)
+    budget = BudgetLedger(store)
+    rate = RateLimitLedger(store)
+    submit_batch_consolidation(
+        store, _tasks(), budget, rate, llm_enabled=False,
+    )
+    events = query_events(store, kind="llm_health")
+    fallback_events = [
+        e for e in events
+        if e["data"].get("component") == "batch_consolidation"
+    ]
+    assert len(fallback_events) >= 1
+
+
+def test_batch_50pct_discount():
+    """Pricing helper returns 50% of sync cost per D-29."""
+    from iai_mcp.batch import BATCH_DISCOUNT, _sync_tier_cost
+
+    sync = _sync_tier_cost(1_000_000, 1_000_000)
+    # Haiku 4.5 approximate -- not exact numbers, just shape.
+    assert sync > 0
+    discounted = sync * BATCH_DISCOUNT
+    assert discounted == sync * 0.5
+    assert BATCH_DISCOUNT == 0.5
+
+
+def test_batch_records_spend_when_eligible(tmp_path, monkeypatch):
+    """Eligible path records a discounted spend to BudgetLedger."""
+    from iai_mcp.batch import submit_batch_consolidation
+
+    monkeypatch.setenv("ANTHROPIC_API_KEY", "test-key")
+    store = MemoryStore(path=tmp_path)
+    budget = BudgetLedger(store)
+    rate = RateLimitLedger(store)
+    before = budget.daily_used()
+    ok, _reason, _results = submit_batch_consolidation(
+        store, _tasks(5), budget, rate, llm_enabled=True,
+    )
+    after = budget.daily_used()
+    # Whether the SDK is present or not, the eligible gate records a nominal
+    # spend (Plan 02-04 scaffolds the budget side-effect; real batch API is
+    # implemented via mock/stub so tests don't hit the network).
+    if ok:
+        assert after >= before
+    else:
+        # If the SDK is unavailable, spend should NOT increase (we never
+        # got past the gate).
+        assert after == before
+
+
+def test_sync_tier_cost_monotonic():
+    """Longer prompts cost more."""
+    from iai_mcp.batch import _sync_tier_cost
+
+    a = _sync_tier_cost(1000, 500)
+    b = _sync_tier_cost(2000, 500)
+    assert b > a