feat: refactor node spec and add mcp tools (#244)

* refactor: carve out extraction panel * refactor: create spec versions for node types * refactor: create a GenericNode and remove custom nodes * feat: add python and typescript sdk * add dograh sdk * fix: fetch draft workflow definition over published one * fix: fix routes of SDKs to use code gen * chore: remove doclink dependency to reduce image size * chore: format files * chore: bump pipecat * feat: let mcp fetch archived workflows on demand * chore: fix tests * feat: add sdk documentation * chore: change banner and add badge
2026-07-25 12:01:04 +02:00 · 2026-04-21 07:56:16 +05:30 · 2026-04-21 07:56:16 +05:30 · 00a1a22b74
commit 00a1a22b74
parent 0a61ef295f
162 changed files with 14355 additions and 3554 deletions
--- a/.dockerignore
+++ b/.dockerignore
@ -1,2 +1,4 @@
 api/.env
 evals/
+api/mcp_server/ts_validator/node_modules/
+sdk/
--- a/.gitignore
+++ b/.gitignore
@ -16,4 +16,5 @@ venv/
 .playwright-mcp
 coturn/
 *.wav
-dograh_pcm_cache/
+dograh_pcm_cache/
+node_modules/
--- a/api/Dockerfile
+++ b/api/Dockerfile
@ -13,11 +13,6 @@ RUN apt-get update && apt-get install -y \
 # Copy and install requirements
 COPY api/requirements.txt .

-# Install CPU-only PyTorch FIRST to prevent CUDA/NVIDIA dependencies
-# This satisfies torch dependency before other packages try to pull GPU version
-RUN pip install --user --no-cache-dir torch --index-url https://download.pytorch.org/whl/cpu && \
-    rm -rf /root/.cache/pip
-
 # Install dependencies to user directory for easy copying
 RUN pip install --user --no-cache-dir -r requirements.txt && \
    # Clean up pip cache after installation
@ -25,27 +20,54 @@ RUN pip install --user --no-cache-dir -r requirements.txt && \

 # Copy and install pipecat from local submodule
 COPY pipecat /tmp/pipecat
-RUN pip install --user --no-cache-dir '/tmp/pipecat[cartesia,deepgram,openai,elevenlabs,groq,google,azure,sarvam,soundfile,silero,webrtc,local-smart-turn-v3,speechmatics,openrouter,camb]' && \
+RUN pip install --user --no-cache-dir '/tmp/pipecat[cartesia,deepgram,openai,elevenlabs,groq,google,azure,sarvam,soundfile,silero,webrtc,speechmatics,openrouter,camb]' && \
+    # Swap opencv-python (pulled by pipecat[webrtc]) for opencv-python-headless
+    # to drop X11/Qt dependencies that otherwise require libxcb etc. in runner.
+    pip uninstall -y opencv-python && \
+    pip install --user --no-cache-dir opencv-python-headless && \
    # Pre-download NLTK punkt_tab tokenizer data (required by pipecat at runtime)
    python -c "import nltk; nltk.download('punkt_tab', quiet=True)" && \
    # Clean up pip cache and temporary pipecat directory
    rm -rf /root/.cache/pip /tmp/pipecat

-# Remove unnecessary Python cache files from installed packages
+# Strip cache files, test/example dirs, and type stubs from installed packages
 RUN find /root/.local -type f -name '*.pyc' -delete && \
-    find /root/.local -type d -name '__pycache__' -delete && \
-    find /root/.local -type f -name '*.pyo' -delete
+    find /root/.local -type d -name '__pycache__' -prune -exec rm -rf {} + && \
+    find /root/.local -type f -name '*.pyo' -delete && \
+    find /root/.local -type d \( -name tests -o -name test -o -name examples \) -prune -exec rm -rf {} + && \
+    find /root/.local -name '*.pyi' -delete

-# Stage 2: Runtime - Minimal image with only runtime dependencies
+# Stage 2: Node deps for ts_validator (built with full node:22-slim, only
+# node_modules is copied into the runner).
+FROM node:22-slim AS ts-deps
+WORKDIR /ts_validator
+COPY api/mcp_server/ts_validator/package*.json ./
+RUN npm ci --omit=dev && npm cache clean --force
+
+# Stage 3: Static ffmpeg binary (avoids apt ffmpeg pulling mesa/libllvm for
+# hardware acceleration we don't use server-side).
+FROM debian:trixie-slim AS ffmpeg-static
+RUN apt-get update && apt-get install -y --no-install-recommends \
+        curl ca-certificates xz-utils \
+    && curl -fsSL -o /tmp/ffmpeg.tar.xz https://johnvansickle.com/ffmpeg/releases/ffmpeg-release-amd64-static.tar.xz \
+    && mkdir -p /tmp/ffmpeg \
+    && tar -xJf /tmp/ffmpeg.tar.xz -C /tmp/ffmpeg --strip-components=1 \
+    && mv /tmp/ffmpeg/ffmpeg /tmp/ffmpeg/ffprobe /usr/local/bin/ \
+    && chmod +x /usr/local/bin/ffmpeg /usr/local/bin/ffprobe
+
+# Stage 4: Runtime - Minimal image with only runtime dependencies
 FROM python:3.12-slim AS runner

 WORKDIR /app

-# Only install ffmpeg (runtime dependency)
-RUN apt-get update && apt-get install -y --no-install-recommends \
-    ffmpeg \
-    && apt-get clean \
-    && rm -rf /var/lib/apt/lists/*
+# Static ffmpeg + ffprobe (used by audio_converter, audio_file_cache, etc.)
+COPY --from=ffmpeg-static /usr/local/bin/ffmpeg /usr/local/bin/ffmpeg
+COPY --from=ffmpeg-static /usr/local/bin/ffprobe /usr/local/bin/ffprobe
+
+# Node.js 22 binary only (ts_validator subprocess needs node >=22.6 for
+# native TypeScript stripping; see api/mcp_server/ts_bridge.py). python:3.12-slim
+# already provides libstdc++6, libgcc-s1, and ca-certificates that node needs.
+COPY --from=node:22-slim /usr/local/bin/node /usr/local/bin/node

 # Copy Python packages from builder stage
 COPY --from=builder /root/.local /root/.local
@ -65,6 +87,10 @@ ENV PYTHONUNBUFFERED=1
 COPY ./api ./api
 COPY ./scripts/start_services_dev.sh ./scripts/start_services_dev.sh

+# ts_validator Node deps (built in ts-deps stage with full node:22-slim image).
+# The validator runs as a short-lived subprocess from api/mcp_server/ts_bridge.py.
+COPY --from=ts-deps /ts_validator/node_modules ./api/mcp_server/ts_validator/node_modules
+
 # Product documentation — read at runtime by the MCP docs tools
 # (search_dograh_docs / fetch_dograh_doc) so agents can learn Dograh.
 COPY ./docs ./docs
--- a/api/app.py
+++ b/api/app.py
@ -27,7 +27,7 @@ from fastapi.middleware.cors import CORSMiddleware
 from loguru import logger

 from api.constants import REDIS_URL
-from api.mcp import mcp
+from api.mcp_server import mcp
 from api.routes.main import router as main_router
 from api.services.pipecat.tracing_config import (
    handle_langfuse_sync,
--- a/api/mcp/init.py
+++ b/api/mcp/init.py
@ -1,3 +0,0 @@
-from api.mcp.server import mcp
-
-__all__ = ["mcp"]
--- a/api/mcp/auth.py
+++ b/api/mcp/auth.py
@ -1,25 +0,0 @@
-from fastapi import HTTPException
-from fastmcp.server.dependencies import get_http_headers
-
-from api.db.models import UserModel
-from api.services.auth.depends import _handle_api_key_auth
-
-
-async def authenticate_mcp_request() -> UserModel:
-    """Resolve the authenticated Dograh user for an MCP tool invocation.
-
-    Accepts either `X-API-Key: <key>` or `Authorization: Bearer <key>`,
-    reusing the API-key flow from `api.services.auth.depends`.
-    """
-    headers = get_http_headers()
-    api_key = headers.get("x-api-key")
-    if not api_key:
-        auth = headers.get("authorization", "")
-        if auth.lower().startswith("bearer "):
-            api_key = auth.split(" ", 1)[1].strip()
-    if not api_key:
-        raise HTTPException(
-            status_code=401,
-            detail="Missing API key — send X-API-Key or Authorization: Bearer <key>",
-        )
-    return await _handle_api_key_auth(api_key)
--- a/api/mcp/server.py
+++ b/api/mcp/server.py
@ -1,6 +0,0 @@
-from fastmcp import FastMCP
-
-mcp = FastMCP("dograh")
-
-from api.mcp.tools import docs as _docs  # noqa: E402, F401
-from api.mcp.tools import workflows as _workflows  # noqa: E402, F401
--- a/api/mcp/tools/docs.py
+++ b/api/mcp/tools/docs.py
@ -1,115 +0,0 @@
-import re
-from functools import lru_cache
-from pathlib import Path
-
-from fastapi import HTTPException
-from rank_bm25 import BM25Okapi
-
-from api.mcp.server import mcp
-
-DOCS_ROOT = Path(__file__).resolve().parents[3] / "docs"
-
-_TOKEN_RE = re.compile(r"[A-Za-z0-9_]+")
-_FRONTMATTER_RE = re.compile(r"^---\n(.*?)\n---\n", re.DOTALL)
-_TITLE_RE = re.compile(r"^title:\s*['\"]?(.+?)['\"]?\s*$", re.MULTILINE)
-_H1_RE = re.compile(r"^#\s+(.+?)\s*$", re.MULTILINE)
-
-
-def _tokenize(text: str) -> list[str]:
-    return [t.lower() for t in _TOKEN_RE.findall(text)]
-
-
-def _extract_title(path: Path, body: str) -> str:
-    fm_match = _FRONTMATTER_RE.match(body)
-    if fm_match:
-        title_match = _TITLE_RE.search(fm_match.group(1))
-        if title_match:
-            return title_match.group(1).strip()
-    h1_match = _H1_RE.search(body)
-    if h1_match:
-        return h1_match.group(1).strip()
-    return path.stem.replace("-", " ").title()
-
-
-def _strip_frontmatter(body: str) -> str:
-    return _FRONTMATTER_RE.sub("", body, count=1)
-
-
-@lru_cache(maxsize=1)
-def _load_index() -> tuple[list[dict], BM25Okapi]:
-    """Read every docs/**/*.mdx file once and build a BM25 index.
-
-    Cached for the process lifetime — docs rarely change between restarts.
-    """
-    docs: list[dict] = []
-    corpus: list[list[str]] = []
-
-    for path in sorted(DOCS_ROOT.rglob("*.mdx")):
-        body = path.read_text(encoding="utf-8")
-        rel = path.relative_to(DOCS_ROOT).as_posix()
-        title = _extract_title(path, body)
-        content = _strip_frontmatter(body)
-        docs.append({"path": rel, "title": title, "content": content})
-        corpus.append(_tokenize(f"{title} {content}"))
-
-    return docs, BM25Okapi(corpus)
-
-
-def _snippet(content: str, query_tokens: list[str], width: int = 240) -> str:
-    lowered = content.lower()
-    for tok in query_tokens:
-        idx = lowered.find(tok)
-        if idx >= 0:
-            start = max(0, idx - width // 2)
-            end = min(len(content), start + width)
-            return (
-                ("…" if start > 0 else "")
-                + content[start:end].strip()
-                + ("…" if end < len(content) else "")
-            )
-    return content[:width].strip() + ("…" if len(content) > width else "")
-
-
-@mcp.tool
-async def search_dograh_docs(query: str, limit: int = 5) -> list[dict]:
-    """Search Dograh's product documentation.
-
-    Returns the top matches as {path, title, snippet}. Pass the returned
-    `path` to `fetch_dograh_doc` to read the full page. Use this first
-    when you need to learn how a Dograh feature works before building
-    against it.
-    """
-    docs, bm25 = _load_index()
-    tokens = _tokenize(query)
-    if not tokens:
-        return []
-
-    scores = bm25.get_scores(tokens)
-    ranked = sorted(zip(scores, docs), key=lambda pair: pair[0], reverse=True)[:limit]
-
-    return [
-        {
-            "path": doc["path"],
-            "title": doc["title"],
-            "snippet": _snippet(doc["content"], tokens),
-            "score": round(float(score), 3),
-        }
-        for score, doc in ranked
-        if score > 0
-    ]
-
-
-@mcp.tool
-async def fetch_dograh_doc(path: str) -> dict:
-    """Fetch the full content of a Dograh docs page by its path
-    (e.g. `core-concepts/workflows.mdx`), as returned by `search_dograh_docs`.
-    """
-    docs, _ = _load_index()
-    for doc in docs:
-        if doc["path"] == path:
-            return {
-                "path": doc["path"],
-                "title": doc["title"],
-                "content": doc["content"],
-            }
-    raise HTTPException(status_code=404, detail=f"Doc not found: {path}")
--- a/api/mcp_server/init.py
+++ b/api/mcp_server/init.py
@ -0,0 +1,3 @@
+from api.mcp_server.server import mcp
+
+__all__ = ["mcp"]
--- a/api/mcp_server/auth.py
+++ b/api/mcp_server/auth.py
@ -0,0 +1,46 @@
+from fastapi import HTTPException
+from fastmcp.server.dependencies import get_http_headers
+from opentelemetry import trace
+
+from api.db.models import UserModel
+from api.services.auth.depends import _handle_api_key_auth
+
+
+async def authenticate_mcp_request() -> UserModel:
+    """Resolve the authenticated Dograh user for an MCP tool invocation.
+
+    Accepts either `X-API-Key: <key>` or `Authorization: Bearer <key>`,
+    reusing the API-key flow from `api.services.auth.depends`.
+
+    Tags the currently-active OTel span with the resolved organization
+    and user identifiers. `_OrgRoutingExporter` reads `dograh.org_id`
+    at export time to dispatch the span to the right Langfuse project;
+    the `langfuse.user.id` / `langfuse.session.id` attributes make the
+    span filterable in the Langfuse UI.
+    """
+    headers = get_http_headers()
+    api_key = headers.get("x-api-key")
+    if not api_key:
+        auth = headers.get("authorization", "")
+        if auth.lower().startswith("bearer "):
+            api_key = auth.split(" ", 1)[1].strip()
+    if not api_key:
+        raise HTTPException(
+            status_code=401,
+            detail="Missing API key — send X-API-Key or Authorization: Bearer <key>",
+        )
+    user = await _handle_api_key_auth(api_key)
+
+    span = trace.get_current_span()
+    if span.is_recording():
+        org_id = user.selected_organization_id
+        # Intentionally NOT `dograh.org_id` — that attribute triggers the
+        # per-org Langfuse routing for pipeline spans, and MCP traffic
+        # should land in the default (developer-facing) project only.
+        # Exposed under `mcp.org_id` for Langfuse UI filtering without
+        # affecting the router.
+        span.set_attribute("mcp.org_id", str(org_id))
+        span.set_attribute("mcp.user_id", str(user.id))
+        span.set_attribute("langfuse.user.id", str(user.id))
+
+    return user
--- a/api/mcp_server/instructions.py
+++ b/api/mcp_server/instructions.py
@ -0,0 +1,124 @@
+"""Top-level orchestration guide surfaced to every MCP session.
+
+Sent to the client via `FastMCP(instructions=...)` — the client bakes
+this into its system prompt, so every LLM session sees it before the
+first tool call. Prefer procedural orchestration here (call order, error
+handling, hard constraints). Design-level per-field guidance belongs in
+each `PropertySpec.llm_hint`; it flows out through `get_node_type` and
+doesn't need to be repeated here.
+
+Extend based on real LLM failures — every bullet below ideally maps to a
+mistake the system has seen at least once.
+"""
+
+DOGRAH_MCP_INSTRUCTIONS = """\
+You build and edit Dograh voice-AI workflows by emitting TypeScript that
+uses the `@dograh/sdk` package. Workflows are stored as JSON; this server
+projects them to TypeScript for editing and parses them back on save.
+
+## Call order
+
+1. `list_workflows` — locate the target workflow.
+2. `get_workflow_code(workflow_id)` — fetch the current source (draft if
+   one exists, otherwise published).
+3. (optional) `list_node_types` / `get_node_type(name)` — consult before
+   adding or editing a node type whose fields aren't already visible in
+   the current code.
+4. Mutate the code in place. Preserve existing nodes, edges, and variable
+   names unless the task requires removing or renaming them.
+5. `save_workflow(workflow_id, code)` — persist as a new draft. The
+   published version is untouched.
+
+## Allowed source shape
+
+The parser is AST-only and rejects anything outside this grammar. At the
+top level, only three statement forms are accepted:
+
+    import ... from "...";                      // any import
+    const <var> = <initializer>;                // bindings (see below)
+    wf.edge(<src>, <tgt>, { label, condition }); // bare edge calls
+
+`<initializer>` is one of:
+    new Workflow({ name: "..." })
+    wf.addTyped(<factory>({ ...fields }) [, { position: [x, y] }])
+    wf.add({ type: "<nodeType>", ...fields [, position: [x, y]] })
+
+No functions, arrow fns, loops, conditionals, ternaries, spreads,
+destructuring, template interpolation, `export`, or `.map`/`.forEach`.
+Data-position values must be plain literals (strings, numbers, booleans,
+null, arrays/objects of same). A single `new Workflow(...)` per file —
+the `name` you pass there is the workflow's display name and is applied
+on save (renames propagate immediately; definition changes go to draft).
+
+## Adding edges — explicit syntax
+
+    wf.edge(source, target, { label: "...", condition: "..." });
+
+Rules:
+- `source` and `target` are the **bare variable identifiers** bound by
+  `wf.addTyped(...)` / `wf.add(...)` — not strings, not `.id`, not inline
+  factories. Both must be declared earlier in the file.
+- `label` is a short tag (≤4 words) shown in call logs to identify the
+  branch: `"qualified"`, `"wrap up"`, `"retry"`.
+- `condition` is a full natural-language predicate the runtime evaluates
+  against the live conversation: `"caller confirmed interest in a demo"`,
+  not `"interested"`. Condition clarity determines routing accuracy.
+- Both fields are required and must be non-empty strings.
+- Edges are directional; emit one `wf.edge(...)` per outgoing branch.
+- Place all edges after all node bindings; group by source node.
+
+Example:
+
+    const greet = wf.addTyped(startCall({ name: "Greet", prompt: "Hi!" }));
+    const done  = wf.addTyped(endCall({ name: "Done", prompt: "Bye." }));
+    wf.edge(greet, done, {
+        label: "wrap up",
+        condition: "user acknowledged the greeting and is ready to end"
+    });
+
+## Hard graph constraints
+
+- Exactly one `startCall` node per workflow; no incoming edges.
+- `endCall` nodes have no outgoing edges.
+- `globalNode` has no incoming or outgoing edges; its prompt is prepended
+  to every other node's prompt at runtime when that node sets
+  `add_global_prompt=true`.
+- Every non-global node must be reachable from `startCall`.
+
+## Iterating on errors
+
+`save_workflow` returns one of:
+  - `parse_error`      Disallowed construct (see grammar above) or
+                       malformed TypeScript.
+  - `validation_error` Node data failed spec validation (unknown field,
+                       missing required, wrong type, bad `options` value).
+  - `graph_validation` Structural rule broken (missing startCall,
+                       unreachable node, edge to/from wrong node type).
+  - `bridge_error`     Internal — retry once, then surface to the user.
+
+Every error carries `line` and `column`. Fix at that location and
+resubmit the **complete source** — this tool does not accept patches.
+
+## Field conventions
+
+- `data.name` is the canonical identifier. Pick a descriptive name
+  (`"Qualify Budget"`, not `"Node1"`) — the generated code uses it as
+  the variable name and call logs reference it.
+- Reference fields take UUIDs, not human names:
+    `tool_refs`, `document_refs` → from `list_tools`, `list_documents`
+    `credential_ref`             → from `list_credentials`
+    `recording_ref`              → from `list_recordings`
+- `mention_textarea` fields (prompts, greetings, etc.) accept
+  `{{template_variables}}` — values resolved at runtime from
+  `pre_call_fetch`, caller context, or earlier extraction passes.
+
+## Style
+
+- Prefer `wf.addTyped(factory({ ... }))` over `wf.add({ type, ... })`.
+- Only include fields whose values differ from the spec default — the
+  parser re-applies defaults on save, so extras are noise.
+- Omit `position`; the server reconciles positions against the previous
+  saved workflow and lays out new nodes automatically.
+- Add nodes in call-flow order (start → intermediate → end) so the
+  generated code reads top-to-bottom, with all edges after all nodes.
+"""
--- a/api/mcp_server/server.py
+++ b/api/mcp_server/server.py
@ -0,0 +1,11 @@
+from fastmcp import FastMCP
+
+from api.mcp_server.instructions import DOGRAH_MCP_INSTRUCTIONS
+
+mcp = FastMCP("dograh", instructions=DOGRAH_MCP_INSTRUCTIONS)
+
+from api.mcp_server.tools import catalog as _catalog  # noqa: E402, F401
+from api.mcp_server.tools import get_workflow_code as _get_workflow_code  # noqa: E402, F401
+from api.mcp_server.tools import node_types as _node_types  # noqa: E402, F401
+from api.mcp_server.tools import save_workflow as _save_workflow  # noqa: E402, F401
+from api.mcp_server.tools import workflows as _workflows  # noqa: E402, F401
--- a/api/mcp_server/tools/init.py
+++ b/api/mcp_server/tools/init.py
--- a/api/mcp_server/tools/catalog.py
+++ b/api/mcp_server/tools/catalog.py
@ -0,0 +1,113 @@
+"""MCP discovery tools for the reference catalogs.
+
+Node properties of type `tool_refs`, `document_refs`, `recording_ref`, and
+`credential_ref` carry UUIDs that resolve against these catalogs. LLMs must
+list the catalog before populating those fields with real UUIDs.
+"""
+
+from api.db import db_client
+from api.mcp_server.auth import authenticate_mcp_request
+from api.mcp_server.server import mcp
+from api.mcp_server.tracing import traced_tool
+
+
+@mcp.tool
+@traced_tool
+async def list_tools(status: str | None = "active") -> list[dict]:
+    """List tools the agent can invoke during a call.
+
+    Returns each tool's `tool_uuid` (use this in node `tool_uuids` properties),
+    `name`, `description`, and `category`. Pass `status=None` to include
+    archived tools.
+    """
+    user = await authenticate_mcp_request()
+    tools = await db_client.get_tools_for_organization(
+        organization_id=user.selected_organization_id,
+        status=status,
+    )
+    return [
+        {
+            "tool_uuid": t.tool_uuid,
+            "name": t.name,
+            "description": t.description or "",
+            "category": t.category,
+        }
+        for t in tools
+    ]
+
+
+@mcp.tool
+@traced_tool
+async def list_documents() -> list[dict]:
+    """List knowledge-base documents the agent can reference during a call.
+
+    Returns each document's `document_uuid` (use this in node
+    `document_uuids` properties), `filename`, and `processing_status`.
+    """
+    user = await authenticate_mcp_request()
+    documents = await db_client.get_documents_for_organization(
+        organization_id=user.selected_organization_id,
+    )
+    return [
+        {
+            "document_uuid": d.document_uuid,
+            "filename": d.filename,
+            "processing_status": d.processing_status,
+            "total_chunks": d.total_chunks,
+        }
+        for d in documents
+    ]
+
+
+@mcp.tool
+@traced_tool
+async def list_credentials() -> list[dict]:
+    """List external credentials available for webhook auth and pre-call fetch.
+
+    Returns each credential's `credential_uuid` (use this in node
+    `credential_uuid` / `pre_call_fetch_credential_uuid` properties), `name`,
+    `description`, and `credential_type`.
+    """
+    user = await authenticate_mcp_request()
+    credentials = await db_client.get_credentials_for_organization(
+        organization_id=user.selected_organization_id,
+    )
+    return [
+        {
+            "credential_uuid": c.credential_uuid,
+            "name": c.name,
+            "description": c.description or "",
+            "credential_type": c.credential_type,
+        }
+        for c in credentials
+    ]
+
+
+@mcp.tool
+@traced_tool
+async def list_recordings(workflow_id: int | None = None) -> list[dict]:
+    """List pre-recorded audio files available for greetings and edge
+    transition speech.
+
+    Returns each recording's `recording_id` (use this in
+    `greeting_recording_id` / `transition_speech_recording_id` properties),
+    `transcript`, and TTS metadata. Pass `workflow_id` to filter to one
+    workflow's recordings.
+    """
+    user = await authenticate_mcp_request()
+    recordings = await db_client.get_recordings(
+        organization_id=user.selected_organization_id,
+        workflow_id=workflow_id,
+    )
+    return [
+        {
+            "id": r.id,
+            "recording_id": r.recording_id,
+            "workflow_id": r.workflow_id,
+            "transcript": r.transcript,
+            "tts_provider": r.tts_provider,
+            "tts_model": r.tts_model,
+            "tts_voice_id": r.tts_voice_id,
+        }
+        for r in recordings
+    ]
--- a/api/mcp_server/tools/get_workflow_code.py
+++ b/api/mcp_server/tools/get_workflow_code.py
@ -0,0 +1,71 @@
+"""MCP tool that returns a workflow as SDK TypeScript code.
+
+Companion to `save_workflow`: the LLM calls `get_workflow_code` to see
+the current state of a workflow as editable code, mutates it, and calls
+`save_workflow` with the new code. Storage stays JSON; the TS form is
+an ephemeral projection for the LLM edit loop.
+
+Selection priority: latest draft → latest published → legacy
+`workflow.workflow_definition`. That matches the UI's "whichever is the
+working copy" behavior so the LLM sees what a human editor would see.
+"""
+
+from __future__ import annotations
+
+from typing import Any
+
+from fastapi import HTTPException
+
+from api.db import db_client
+from api.mcp_server.auth import authenticate_mcp_request
+from api.mcp_server.server import mcp
+from api.mcp_server.tracing import traced_tool
+from api.mcp_server.ts_bridge import TsBridgeError, generate_code
+
+
+@mcp.tool
+@traced_tool
+async def get_workflow_code(workflow_id: int) -> dict[str, Any]:
+    """Return the workflow as SDK TypeScript code the LLM can edit.
+
+    Output shape:
+        {"code": "<TS source>", "workflow_id": int, "version": "draft" | "published" | "legacy"}
+
+    The LLM edits `code`, then calls `save_workflow(workflow_id, code)`.
+    """
+    user = await authenticate_mcp_request()
+
+    workflow = await db_client.get_workflow(
+        workflow_id, organization_id=user.selected_organization_id
+    )
+    if not workflow:
+        raise HTTPException(status_code=404, detail=f"Workflow {workflow_id} not found")
+
+    # Draft wins over published — editing a draft is the normal flow.
+    # `current_definition` (is_current=True) is the published row, so we
+    # fetch the draft explicitly. If the latest draft was just published,
+    # no draft row exists and we fall through to `released_definition`.
+    draft = await db_client.get_draft_version(workflow_id)
+    released = workflow.released_definition
+
+    if draft is not None and draft.workflow_json:
+        payload = draft.workflow_json
+        source = "draft"
+    elif released is not None and released.workflow_json:
+        payload = released.workflow_json
+        source = "published"
+    else:
+        payload = workflow.workflow_definition or {}
+        source = "legacy"
+
+    try:
+        code = await generate_code(payload, workflow_name=workflow.name or "")
+    except TsBridgeError as e:
+        raise HTTPException(status_code=500, detail=f"Failed to generate code: {e}")
+
+    return {
+        "workflow_id": workflow_id,
+        "name": workflow.name or "",
+        "version": source,
+        "code": code,
+    }
--- a/api/mcp_server/tools/node_types.py
+++ b/api/mcp_server/tools/node_types.py
@ -0,0 +1,57 @@
+"""MCP discovery tools for node specifications.
+
+LLMs call these tools first to learn the available node-type catalog and
+each node's property schema before composing or modifying a workflow.
+"""
+
+from fastapi import HTTPException
+
+from api.mcp_server.auth import authenticate_mcp_request
+from api.mcp_server.server import mcp
+from api.mcp_server.tracing import traced_tool
+from api.services.workflow.node_specs import SPEC_VERSION, all_specs, get_spec
+
+
+@mcp.tool
+@traced_tool
+async def list_node_types() -> dict:
+    """List every available node type with a brief summary.
+
+    Use this first to discover what nodes exist, then call `get_node_type`
+    for the full schema of any node you intend to use.
+
+    Returns:
+        A dict with `spec_version` (pin against this in any generated workflow
+        code) and `node_types` (list of {name, display_name, description,
+        category}).
+    """
+    await authenticate_mcp_request()
+    return {
+        "spec_version": SPEC_VERSION,
+        "node_types": [
+            {
+                "name": spec.name,
+                "display_name": spec.display_name,
+                "description": spec.description,
+                "category": spec.category.value,
+            }
+            for spec in all_specs()
+        ],
+    }
+
+
+@mcp.tool
+@traced_tool
+async def get_node_type(name: str) -> dict:
+    """Fetch the full schema for a node type, including every property's
+    type, default, conditional visibility rules, and LLM-readable
+    description, plus worked examples.
+
+    Use the property `description` and the `examples` list to understand
+    semantics — types alone are not enough.
+    """
+    await authenticate_mcp_request()
+    spec = get_spec(name)
+    if spec is None:
+        raise HTTPException(status_code=404, detail=f"Unknown node type: {name!r}")
+    return spec.model_dump(mode="json")
--- a/api/mcp_server/tools/save_workflow.py
+++ b/api/mcp_server/tools/save_workflow.py
@ -0,0 +1,168 @@
+"""MCP tool that accepts LLM-authored SDK TypeScript and saves it as a draft.
+
+Execution flow:
+    1. Parse via the Node TS validator — AST-only, never executes the code.
+       Returns either a workflow JSON or per-location parse/validate errors.
+    2. Pydantic validation via `ReactFlowDTO.model_validate` (defence in
+       depth; the parser is already spec-driven, but the DTO layer is the
+       authoritative wire-format gate).
+    3. Graph validation via `WorkflowGraph`.
+    4. Save as a new draft via `db_client.save_workflow_draft` — the
+       published version stays intact, so edits are rollback-safe.
+
+Error codes surfaced to the LLM:
+    parse_error       — TS parse failed or a disallowed construct was used
+    validation_error  — node data failed spec validation (unknown field,
+                        missing required, wrong type, option out of range)
+    schema_validation — ReactFlowDTO Pydantic rejection (rare; parser bug)
+    graph_validation  — semantic graph rule broken (e.g. no start node)
+    bridge_error      — Node subprocess failed before returning JSON
+
+All LLM-facing errors include file:line:column where available so the
+LLM can correct its code directly.
+"""
+
+from __future__ import annotations
+
+from typing import Any
+
+from fastapi import HTTPException
+from loguru import logger
+from pydantic import ValidationError as PydanticValidationError
+
+from api.db import db_client
+from api.mcp_server.auth import authenticate_mcp_request
+from api.mcp_server.server import mcp
+from api.mcp_server.tracing import traced_tool
+from api.mcp_server.ts_bridge import TsBridgeError, parse_code
+from api.services.workflow.dto import ReactFlowDTO
+from api.services.workflow.layout import reconcile_positions
+from api.services.workflow.workflow import WorkflowGraph
+
+
+async def _previous_workflow_json(workflow: Any) -> dict[str, Any] | None:
+    """Same selection priority as `get_workflow_code` — the version the
+    LLM saw is the version we reconcile against.
+
+    `current_definition` (is_current=True) is the published row, so the
+    draft must be fetched explicitly. If no draft exists (e.g. the last
+    draft was just published), fall through to `released_definition`.
+    """
+    draft = await db_client.get_draft_version(workflow.id)
+    if draft is not None and draft.workflow_json:
+        return draft.workflow_json
+    released = workflow.released_definition
+    if released is not None and released.workflow_json:
+        return released.workflow_json
+    return workflow.workflow_definition or None
+
+
+def _error_result(code: str, message: str, **extra: Any) -> dict[str, Any]:
+    return {"saved": False, "error_code": code, "error": message, **extra}
+
+
+def _format_errors(errors: list[dict[str, Any]]) -> str:
+    parts: list[str] = []
+    for e in errors:
+        loc = ""
+        line = e.get("line")
+        col = e.get("column")
+        if line is not None:
+            loc = f" (line {line}" + (f", col {col}" if col is not None else "") + ")"
+        parts.append(f"{e.get('message', '')}{loc}")
+    return "\n".join(parts)
+
+
+@mcp.tool
+@traced_tool
+async def save_workflow(workflow_id: int, code: str) -> dict[str, Any]:
+    """Parse SDK TypeScript and save the resulting workflow as a draft.
+
+    `code` is TypeScript source using `@dograh/sdk`. Fetch the current
+    code first via `get_workflow_code(workflow_id)`, edit it, then pass
+    the full updated source here.
+
+    Example code:
+        import { Workflow } from "@dograh/sdk";
+        import { startCall, endCall } from "@dograh/sdk/typed";
+
+        const wf = new Workflow({ name: "lead_qualification" });
+        const greeting = wf.addTyped(startCall({ name: "Greeting", prompt: "Hi!" }));
+        const done     = wf.addTyped(endCall({ name: "Done", prompt: "Bye." }));
+        wf.edge(greeting, done, { label: "done", condition: "conversation complete" });
+
+    On success the draft version is saved; the published version is
+    untouched.
+    """
+    user = await authenticate_mcp_request()
+
+    workflow = await db_client.get_workflow(
+        workflow_id, organization_id=user.selected_organization_id
+    )
+    if not workflow:
+        raise HTTPException(status_code=404, detail=f"Workflow {workflow_id} not found")
+
+    # 1. Parse + spec-validate via the Node TS validator.
+    try:
+        parsed = await parse_code(code)
+    except TsBridgeError as e:
+        logger.warning(f"ts_bridge failure: {e}")
+        return _error_result("bridge_error", str(e))
+
+    if not parsed.get("ok"):
+        stage = parsed.get("stage", "parse")
+        errs = parsed.get("errors") or []
+        code_key = "parse_error" if stage == "parse" else "validation_error"
+        return _error_result(code_key, _format_errors(errs), errors=errs)
+
+    payload = parsed["workflow"]
+    new_name = (parsed.get("workflowName") or "").strip()
+
+    # 1b. Reconcile node positions against the previously-stored workflow.
+    # The parser drops positions by design (LLMs don't place nodes well);
+    # here we fill them back in from what was there before, and pick
+    # approximate placements for newly-introduced nodes.
+    payload = reconcile_positions(payload, await _previous_workflow_json(workflow))
+
+    # 2. Pydantic shape check (defence in depth — parser is spec-driven).
+    try:
+        dto = ReactFlowDTO.model_validate(payload)
+    except PydanticValidationError as e:
+        return _error_result("schema_validation", str(e))
+
+    # 3. Graph-level semantic validation (start-node count, edge shape).
+    try:
+        WorkflowGraph(dto)
+    except (ValueError, Exception) as e:  # WorkflowGraph raises ValueError
+        return _error_result("graph_validation", str(e))
+
+    # 4a. If the `new Workflow({ name })` in the edited source differs from
+    # the stored name, rename the workflow. Name is a workflow-level field
+    # (not versioned), so this takes effect immediately.
+    name_changed = bool(new_name) and new_name != workflow.name
+    if name_changed:
+        await db_client.update_workflow(
+            workflow_id=workflow_id,
+            name=new_name,
+            workflow_definition=None,
+            template_context_variables=None,
+            workflow_configurations=None,
+            organization_id=user.selected_organization_id,
+        )
+
+    # 4b. Save as a new draft (existing published version stays intact).
+    draft = await db_client.save_workflow_draft(
+        workflow_id=workflow_id,
+        workflow_definition=payload,
+    )
+
+    return {
+        "saved": True,
+        "workflow_id": workflow_id,
+        "version_number": draft.version_number,
+        "status": draft.status,
+        "node_count": len(payload["nodes"]),
+        "edge_count": len(payload["edges"]),
+        "name": new_name or workflow.name,
+        "renamed": name_changed,
+    }
--- a/api/mcp_server/tools/workflows.py
+++ b/api/mcp_server/tools/workflows.py
@ -1,17 +1,20 @@
 from fastapi import HTTPException

 from api.db import db_client
-from api.mcp.auth import authenticate_mcp_request
-from api.mcp.server import mcp
+from api.mcp_server.auth import authenticate_mcp_request
+from api.mcp_server.server import mcp
+from api.mcp_server.tracing import traced_tool


@mcp.tool
-async def list_workflows(status: str | None = None) -> list[dict]:
+@traced_tool
+async def list_workflows(status: str | None = "active") -> list[dict]:
    """List agents (workflows) in the caller's organization.

    Returns id, name, status, and created_at for each agent. Use
-    `get_workflow` to fetch a single agent's full definition. Pass
-    `status="active"` or `status="archived"` to filter.
+    `get_workflow` to fetch a single agent's full definition. Defaults
+    to active agents; pass `status="archived"` to list archived agents,
+    or `status=None` to list all.
    """
    user = await authenticate_mcp_request()
    workflows = await db_client.get_all_workflows_for_listing(
@ -30,6 +33,7 @@ async def list_workflows(status: str | None = None) -> list[dict]:


@mcp.tool
+@traced_tool
 async def get_workflow(workflow_id: int) -> dict:
    """Fetch a single agent by id, including its current published definition."""
    user = await authenticate_mcp_request()
--- a/api/mcp_server/tracing.py
+++ b/api/mcp_server/tracing.py
@ -0,0 +1,87 @@
+"""OTel tracing for MCP tool invocations.
+
+The project-wide tracing setup in
+`api/services/pipecat/tracing_config.py` already routes spans to
+per-organization Langfuse projects based on the `dograh.org_id` span
+attribute. This module plugs MCP tool calls into that pipeline:
+
+    @mcp.tool
+    @traced_tool
+    async def my_tool(...): ...
+
+Each decorated invocation produces one span named `mcp.<tool_name>` with
+Langfuse-rendered input/output. Organization and user attributes are
+stamped separately by `authenticate_mcp_request` when it runs inside
+the tool body — the decorator's span is the `current_span` at that
+point, so the attributes land on the right span and the router export
+dispatches to the correct Langfuse project.
+"""
+
+from __future__ import annotations
+
+import json
+from functools import wraps
+from typing import Any, Awaitable, Callable, TypeVar
+
+from opentelemetry import trace
+from opentelemetry.context import Context
+from opentelemetry.trace import Status, StatusCode
+
+R = TypeVar("R")
+
+_TRACER = trace.get_tracer("dograh.mcp")
+# Langfuse truncates long payloads anyway; cap here to keep span size
+# bounded. Tune up if you find tool outputs consistently clipped.
+_MAX_ATTR_LEN = 8000
+
+
+def _safe_json(value: Any) -> str:
+    try:
+        return json.dumps(value, default=str, ensure_ascii=False)
+    except Exception:  # noqa: BLE001
+        return str(value)
+
+
+def traced_tool(fn: Callable[..., Awaitable[R]]) -> Callable[..., Awaitable[R]]:
+    """Wrap an MCP tool so each invocation produces a span.
+
+    Captures tool name, input kwargs, output, and exceptions. Stacks
+    below `@mcp.tool` so FastMCP sees the wrapped function when
+    introspecting the tool schema (`functools.wraps` preserves the
+    signature the framework reads).
+    """
+
+    @wraps(fn)
+    async def wrapper(*args: Any, **kwargs: Any) -> R:
+        # Each MCP tool call is its own root trace. Passing an empty
+        # `Context()` severs the inherited parent so the span doesn't
+        # graft onto whatever other trace happens to be active (e.g.
+        # the FastAPI request span, or a client-propagated context).
+        # One trace per tool invocation makes Langfuse diffing and
+        # per-org filtering clean.
+        with _TRACER.start_as_current_span(
+            f"mcp.{fn.__name__}",
+            context=Context(),
+        ) as span:
+            span.set_attribute("mcp.tool.name", fn.__name__)
+            # Explicit trace-name override so the Langfuse UI shows
+            # `mcp.<tool>` at the top of the trace instead of whatever
+            # the framework happens to name the root span.
+            span.set_attribute("langfuse.trace.name", f"mcp.{fn.__name__}")
+            span.set_attribute(
+                "langfuse.observation.input",
+                _safe_json(kwargs)[:_MAX_ATTR_LEN],
+            )
+            try:
+                result = await fn(*args, **kwargs)
+            except Exception as e:
+                span.record_exception(e)
+                span.set_status(Status(StatusCode.ERROR, str(e)))
+                raise
+            span.set_attribute(
+                "langfuse.observation.output",
+                _safe_json(result)[:_MAX_ATTR_LEN],
+            )
+            return result
+
+    return wrapper
--- a/api/mcp_server/ts_bridge.py
+++ b/api/mcp_server/ts_bridge.py
@ -0,0 +1,93 @@
+"""Python-side bridge to the Node TS validator.
+
+Spawns `node api/mcp_server/ts_validator/src/index.ts` as a short-lived
+subprocess per call, streams a JSON request on stdin, reads a JSON
+response from stdout. The validator never executes LLM code — it either
+emits TypeScript from a workflow JSON (`generate`) or parses LLM-authored
+TS back into a workflow JSON via AST walking (`parse`).
+
+The subprocess startup cost is ~100-200ms per call. Fine for MCP tool
+rates; if it ever matters, the validator can be promoted to a long-lived
+worker over a unix socket without changing this interface.
+"""
+
+from __future__ import annotations
+
+import asyncio
+import json
+from pathlib import Path
+from typing import Any
+
+from api.services.workflow.node_specs import all_specs
+
+_VALIDATOR_ENTRY = Path(__file__).resolve().parent / "ts_validator" / "src" / "index.ts"
+
+
+class TsBridgeError(Exception):
+    """The Node subprocess failed before producing a JSON response."""
+
+
+def _specs_payload() -> list[dict[str, Any]]:
+    return [s.model_dump(mode="json") for s in all_specs()]
+
+
+async def _invoke(request: dict[str, Any]) -> dict[str, Any]:
+    proc = await asyncio.create_subprocess_exec(
+        "node",
+        str(_VALIDATOR_ENTRY),
+        stdin=asyncio.subprocess.PIPE,
+        stdout=asyncio.subprocess.PIPE,
+        stderr=asyncio.subprocess.PIPE,
+    )
+    stdout, stderr = await proc.communicate(json.dumps(request).encode("utf-8"))
+    if proc.returncode != 0 and not stdout:
+        raise TsBridgeError(
+            f"ts_validator exited {proc.returncode}: "
+            f"{stderr.decode('utf-8', errors='replace')}"
+        )
+    try:
+        return json.loads(stdout.decode("utf-8"))
+    except json.JSONDecodeError as e:
+        raise TsBridgeError(
+            f"ts_validator emitted non-JSON: {stdout!r} (stderr: {stderr!r})"
+        ) from e
+
+
+async def generate_code(workflow: dict[str, Any], *, workflow_name: str = "") -> str:
+    """Emit SDK TypeScript source from a workflow JSON payload.
+
+    Raises `TsBridgeError` if the validator can't produce code (unknown
+    node type, dangling edge reference, etc.) — these are bugs at the
+    caller layer, not user input, so we fail loudly.
+    """
+    result = await _invoke(
+        {
+            "command": "generate",
+            "workflow": workflow,
+            "specs": _specs_payload(),
+            "workflowName": workflow_name,
+        }
+    )
+    if not result.get("ok"):
+        errs = result.get("errors") or [{"message": "unknown failure"}]
+        raise TsBridgeError(
+            "generate_code failed: " + "; ".join(e.get("message", "") for e in errs)
+        )
+    return result["code"]
+
+
+async def parse_code(code: str) -> dict[str, Any]:
+    """Parse LLM-authored TS back into a workflow JSON.
+
+    Returns the raw validator response — `{"ok": True, "workflow": {...}}`
+    on success, `{"ok": False, "stage": "parse" | "validate", "errors": [...]}`
+    on author-side failure. Author-side failures are surfaced to the LLM
+    verbatim so it can iterate; callers should not re-wrap them.
+    """
+    return await _invoke(
+        {
+            "command": "parse",
+            "code": code,
+            "specs": _specs_payload(),
+        }
+    )
--- a/api/mcp_server/ts_validator/.gitignore
+++ b/api/mcp_server/ts_validator/.gitignore
@ -0,0 +1 @@
+node_modules/
--- a/api/mcp_server/ts_validator/package-lock.json
+++ b/api/mcp_server/ts_validator/package-lock.json
@ -0,0 +1,31 @@
+{
+    "name": "dograh-ts-validator",
+    "version": "0.0.0",
+    "lockfileVersion": 3,
+    "requires": true,
+    "packages": {
+        "": {
+            "name": "dograh-ts-validator",
+            "version": "0.0.0",
+            "dependencies": {
+                "typescript": "^5.6.0"
+            },
+            "engines": {
+                "node": ">=22.6"
+            }
+        },
+        "node_modules/typescript": {
+            "version": "5.9.3",
+            "resolved": "https://registry.npmjs.org/typescript/-/typescript-5.9.3.tgz",
+            "integrity": "sha512-jl1vZzPDinLr9eUt3J/t7V6FgNEw9QjvBPdysz9KfQDD41fQrC2Y4vKQdiaUpFT4bXlb1RHhLpp8wtm6M5TgSw==",
+            "license": "Apache-2.0",
+            "bin": {
+                "tsc": "bin/tsc",
+                "tsserver": "bin/tsserver"
+            },
+            "engines": {
+                "node": ">=14.17"
+            }
+        }
+    }
+}
--- a/api/mcp_server/ts_validator/package.json
+++ b/api/mcp_server/ts_validator/package.json
@ -0,0 +1,13 @@
+{
+    "name": "dograh-ts-validator",
+    "private": true,
+    "version": "0.0.0",
+    "type": "module",
+    "description": "Node helper invoked by the Python MCP server. Converts workflow JSON to SDK TypeScript code (generate) and parses LLM-authored TS back into a validated workflow JSON (parse). Runs as a short-lived subprocess over stdin/stdout.",
+    "dependencies": {
+        "typescript": "^5.6.0"
+    },
+    "engines": {
+        "node": ">=22.6"
+    }
+}
--- a/api/mcp_server/ts_validator/src/generate.ts
+++ b/api/mcp_server/ts_validator/src/generate.ts
@ -0,0 +1,304 @@
+// JSON → TypeScript source. Emits flat code the LLM can read and edit:
+// imports, a `Workflow` construction, one `addTyped` per node, one `edge`
+// per edge. Variable names are derived from `data.name` (falling back to
+// the node id) and deduplicated so the AST round-trips back through
+// `parse.ts` into the same workflow JSON.
+
+import type {
+    GenerateResult,
+    NodeSpec,
+    PropertySpec,
+    WireWorkflow,
+} from "./types.ts";
+
+export function generateCode(
+    workflow: WireWorkflow,
+    specs: NodeSpec[],
+    opts: { workflowName?: string } = {},
+): GenerateResult {
+    const specByName = new Map(specs.map((s) => [s.name, s]));
+
+    // Catch unknown node types up-front — otherwise we'd emit an import
+    // line for a factory that doesn't exist.
+    for (const n of workflow.nodes) {
+        if (!specByName.has(n.type)) {
+            return {
+                ok: false,
+                errors: [
+                    {
+                        message: `Unknown node type in workflow: "${n.type}"`,
+                    },
+                ],
+            };
+        }
+    }
+
+    const factoryNames = [
+        ...new Set(workflow.nodes.map((n) => n.type)),
+    ].sort();
+    const nodeVarById = new Map<string, string>();
+    const usedNames = new Set<string>();
+
+    const lines: string[] = [];
+    lines.push(`import { Workflow } from "@dograh/sdk";`);
+    if (factoryNames.length > 0) {
+        lines.push(
+            `import { ${factoryNames.join(", ")} } from "@dograh/sdk/typed";`,
+        );
+    }
+    lines.push("");
+    const wfName = opts.workflowName ?? "";
+    lines.push(
+        `const wf = new Workflow(${renderObject({ name: wfName }, 0)});`,
+    );
+    lines.push("");
+
+    for (const node of workflow.nodes) {
+        const varName = pickVarName(node, usedNames);
+        nodeVarById.set(node.id, varName);
+
+        const spec = specByName.get(node.type)!;
+        // Strip legacy/UI-state fields the spec doesn't know about
+        // (e.g. `invalid`, `selected`, `dragging`, `is_start`,
+        // `validationMessage`). They accumulated in stored workflow
+        // data before the parser enforced spec validation, and are
+        // pure noise from the LLM's perspective — dropping them keeps
+        // the editing surface clean and avoids a pointless save-time
+        // rejection round-trip.
+        const knownOnly = stripUnknown(node.data, spec);
+        const data = stripDefaults(knownOnly, spec);
+        const factoryArg = renderObject(data, 0);
+
+        // Positions are intentionally omitted — LLMs don't place nodes
+        // sensibly, so we let a downstream auto-layout pass (future
+        // enhancement) assign coordinates on save. Existing positions
+        // in the DB are preserved by `parse.ts` defaulting to {0,0}
+        // and the save path leaving pre-existing node positions alone.
+        lines.push(
+            `const ${varName} = wf.addTyped(${node.type}(${factoryArg}));`,
+        );
+    }
+
+    if (workflow.edges.length > 0) {
+        lines.push("");
+    }
+    for (const edge of workflow.edges) {
+        const src = nodeVarById.get(edge.source);
+        const tgt = nodeVarById.get(edge.target);
+        if (!src || !tgt) {
+            return {
+                ok: false,
+                errors: [
+                    {
+                        message:
+                            `Edge ${edge.id} references unknown node ` +
+                            `(source=${edge.source}, target=${edge.target}).`,
+                    },
+                ],
+            };
+        }
+        const cleanedEdge = pickEdgeFields(edge.data);
+        const edgeOpts = renderObject(cleanedEdge, 0);
+        lines.push(`wf.edge(${src}, ${tgt}, ${edgeOpts});`);
+    }
+
+    return { ok: true, code: lines.join("\n") + "\n" };
+}
+
+// ─── helpers ──────────────────────────────────────────────────────────
+
+function pickVarName(
+    node: { id: string; data: Record<string, unknown> },
+    used: Set<string>,
+): string {
+    const seed =
+        typeof node.data["name"] === "string" && node.data["name"].trim()
+            ? (node.data["name"] as string)
+            : `node_${node.id}`;
+    const base = sanitizeIdentifier(seed);
+    let candidate = base;
+    let i = 2;
+    while (used.has(candidate) || RESERVED.has(candidate)) {
+        candidate = `${base}_${i++}`;
+    }
+    used.add(candidate);
+    return candidate;
+}
+
+function sanitizeIdentifier(raw: string): string {
+    const cleaned = raw
+        .trim()
+        .replace(/[^a-zA-Z0-9_]+/g, "_")
+        .replace(/^_+|_+$/g, "")
+        .toLowerCase();
+    if (!cleaned) return "node";
+    if (/^[0-9]/.test(cleaned)) return `n_${cleaned}`;
+    return cleaned;
+}
+
+const RESERVED = new Set([
+    "wf",
+    "const",
+    "let",
+    "var",
+    "new",
+    "function",
+    "class",
+    "import",
+    "export",
+    "return",
+    "if",
+    "else",
+    "for",
+    "while",
+    "do",
+    "switch",
+    "case",
+    "break",
+    "continue",
+    "default",
+    "throw",
+    "try",
+    "catch",
+    "finally",
+    "await",
+    "async",
+    "true",
+    "false",
+    "null",
+    "undefined",
+    "this",
+    "super",
+    "in",
+    "of",
+    "typeof",
+    "instanceof",
+    "delete",
+    "void",
+    "yield",
+    "Workflow",
+]);
+
+// Drop keys not declared in the spec. Handles nested `fixed_collection`
+// rows by recursing through sub-property specs. Anything that isn't in
+// the spec is legacy/UI state and should never reach the LLM.
+function stripUnknown(
+    data: Record<string, unknown>,
+    spec: NodeSpec,
+): Record<string, unknown> {
+    const known = new Map<string, PropertySpec>();
+    for (const p of spec.properties ?? []) known.set(p.name, p);
+
+    const out: Record<string, unknown> = {};
+    for (const [k, v] of Object.entries(data)) {
+        const prop = known.get(k);
+        if (!prop) continue; // drop unknown
+        if (prop.type === "fixed_collection" && Array.isArray(v)) {
+            const rowSpec: NodeSpec = {
+                name: prop.name,
+                properties: prop.properties ?? [],
+            };
+            out[k] = v.map((row) =>
+                row && typeof row === "object" && !Array.isArray(row)
+                    ? stripUnknown(row as Record<string, unknown>, rowSpec)
+                    : row,
+            );
+        } else {
+            out[k] = v;
+        }
+    }
+    return out;
+}
+
+// Edge schema is fixed (no NodeSpec for edges). Mirrors the allowed
+// fields on `Workflow.edge(...)` in both SDKs.
+const KNOWN_EDGE_FIELDS = new Set([
+    "label",
+    "condition",
+    "transition_speech",
+    "transition_speech_type",
+    "transition_speech_recording_id",
+]);
+
+function pickEdgeFields(
+    data: Record<string, unknown>,
+): Record<string, unknown> {
+    const out: Record<string, unknown> = {};
+    for (const [k, v] of Object.entries(data)) {
+        if (KNOWN_EDGE_FIELDS.has(k)) out[k] = v;
+    }
+    return out;
+}
+
+// Drop keys whose value equals the spec default — keeps emitted code tight.
+function stripDefaults(
+    data: Record<string, unknown>,
+    spec: NodeSpec,
+): Record<string, unknown> {
+    const out: Record<string, unknown> = {};
+    const defaults = new Map<string, unknown>();
+    for (const prop of spec.properties ?? []) {
+        if (prop.default !== undefined && prop.default !== null) {
+            defaults.set(prop.name, prop.default);
+        }
+    }
+    for (const [k, v] of Object.entries(data)) {
+        if (defaults.has(k) && deepEqual(defaults.get(k), v)) continue;
+        out[k] = v;
+    }
+    return out;
+}
+
+function deepEqual(a: unknown, b: unknown): boolean {
+    if (a === b) return true;
+    if (typeof a !== typeof b) return false;
+    if (a === null || b === null) return false;
+    if (Array.isArray(a) && Array.isArray(b)) {
+        if (a.length !== b.length) return false;
+        return a.every((el, i) => deepEqual(el, b[i]));
+    }
+    if (typeof a === "object" && typeof b === "object") {
+        const ak = Object.keys(a as object).sort();
+        const bk = Object.keys(b as object).sort();
+        if (ak.length !== bk.length) return false;
+        if (ak.some((k, i) => k !== bk[i])) return false;
+        return ak.every((k) =>
+            deepEqual(
+                (a as Record<string, unknown>)[k],
+                (b as Record<string, unknown>)[k],
+            ),
+        );
+    }
+    return false;
+}
+
+// Object renderer biased for readability — strings use single-line JSON,
+// nested objects/arrays indent one level per depth.
+function renderObject(obj: Record<string, unknown>, depth: number): string {
+    const keys = Object.keys(obj);
+    if (keys.length === 0) return "{}";
+    const pad = "    ".repeat(depth + 1);
+    const closingPad = "    ".repeat(depth);
+    const parts = keys.map((k) => {
+        const v = renderValue(obj[k], depth + 1);
+        return `${pad}${k}: ${v}`;
+    });
+    return `{\n${parts.join(",\n")},\n${closingPad}}`;
+}
+
+function renderValue(v: unknown, depth: number): string {
+    if (v === null || v === undefined) return "null";
+    if (typeof v === "string") return JSON.stringify(v);
+    if (typeof v === "number" || typeof v === "boolean") return String(v);
+    if (Array.isArray(v)) {
+        if (v.length === 0) return "[]";
+        const pad = "    ".repeat(depth + 1);
+        const closingPad = "    ".repeat(depth);
+        const items = v.map((el) => `${pad}${renderValue(el, depth + 1)}`);
+        return `[\n${items.join(",\n")},\n${closingPad}]`;
+    }
+    if (typeof v === "object") {
+        return renderObject(v as Record<string, unknown>, depth);
+    }
+    return JSON.stringify(v);
+}
--- a/api/mcp_server/ts_validator/src/index.ts
+++ b/api/mcp_server/ts_validator/src/index.ts
@ -0,0 +1,74 @@
+// Stdin/stdout dispatch. Reads a single JSON request, routes to
+// generate or parse, writes a single JSON response. Exits 0 on request
+// success (including validation failures — those are in the JSON), and
+// exits 1 only on internal errors (bad input JSON, unhandled exception).
+
+import { generateCode } from "./generate.ts";
+import { parseCode } from "./parse.ts";
+import type { NodeSpec, WireWorkflow } from "./types.ts";
+
+interface GenerateRequest {
+    command: "generate";
+    workflow: WireWorkflow;
+    specs: NodeSpec[];
+    workflowName?: string;
+}
+
+interface ParseRequest {
+    command: "parse";
+    code: string;
+    specs: NodeSpec[];
+}
+
+type Request = GenerateRequest | ParseRequest;
+
+async function readStdin(): Promise<string> {
+    const chunks: Buffer[] = [];
+    for await (const chunk of process.stdin) {
+        chunks.push(chunk as Buffer);
+    }
+    return Buffer.concat(chunks).toString("utf-8");
+}
+
+function writeResult(payload: unknown): void {
+    process.stdout.write(JSON.stringify(payload));
+}
+
+async function main(): Promise<void> {
+    const input = await readStdin();
+    let req: Request;
+    try {
+        req = JSON.parse(input) as Request;
+    } catch (e) {
+        writeResult({
+            ok: false,
+            stage: "internal",
+            errors: [{ message: `Invalid JSON on stdin: ${(e as Error).message}` }],
+        });
+        process.exit(1);
+    }
+
+    if (req.command === "generate") {
+        writeResult(generateCode(req.workflow, req.specs, { workflowName: req.workflowName }));
+        return;
+    }
+    if (req.command === "parse") {
+        writeResult(parseCode(req.code, req.specs));
+        return;
+    }
+    writeResult({
+        ok: false,
+        stage: "internal",
+        errors: [{ message: `Unknown command: ${(req as { command?: unknown }).command}` }],
+    });
+    process.exit(1);
+}
+
+main().catch((err: unknown) => {
+    writeResult({
+        ok: false,
+        stage: "internal",
+        errors: [{ message: (err as Error).stack ?? String(err) }],
+    });
+    process.exit(1);
+});
--- a/api/mcp_server/ts_validator/src/parse.ts
+++ b/api/mcp_server/ts_validator/src/parse.ts
@ -0,0 +1,612 @@
+// TypeScript → workflow JSON.
+//
+// Parses LLM-authored SDK code with the TypeScript compiler, walks the
+// AST statement by statement, and builds up a workflow JSON from the
+// recognized SDK patterns:
+//
+//   const wf = new Workflow({ name: "..." });
+//   const X  = wf.addTyped(startCall({ ...fields }));
+//   const Y  = wf.add({ type: "endCall", ...fields });
+//   wf.edge(X, Y, { label: "...", condition: "..." });
+//
+// No code is executed. Any top-level statement that doesn't match one
+// of the recognized shapes is a parse error with a file:line:col pointer
+// so the LLM can iterate. Node data is validated against the spec
+// catalog before returning.
+
+import ts from "typescript";
+
+import type {
+    NodeSpec,
+    ParseErrorItem,
+    ParseResult,
+    PropertySpec,
+    WireEdge,
+    WireNode,
+} from "./types.ts";
+
+export function parseCode(code: string, specs: NodeSpec[]): ParseResult {
+    const specByName = new Map(specs.map((s) => [s.name, s]));
+    const sourceFile = ts.createSourceFile(
+        "workflow.ts",
+        code,
+        ts.ScriptTarget.ESNext,
+        true,
+        ts.ScriptKind.TS,
+    );
+
+    const errors: ParseErrorItem[] = [];
+    const nodes: WireNode[] = [];
+    const edges: WireEdge[] = [];
+    const nodeRefs = new Map<string, WireNode>();
+    let workflowVar: string | null = null;
+    let workflowName = "";
+    let nextId = 1;
+
+    const addError = (node: ts.Node, message: string): void => {
+        const pos = sourceFile.getLineAndCharacterOfPosition(node.getStart());
+        errors.push({
+            message,
+            line: pos.line + 1,
+            column: pos.character + 1,
+        });
+    };
+
+    for (const stmt of sourceFile.statements) {
+        if (ts.isImportDeclaration(stmt)) continue; // imports are harmless
+        if (
+            ts.isExportAssignment(stmt) ||
+            stmt.kind === ts.SyntaxKind.EmptyStatement
+        ) {
+            continue;
+        }
+
+        // `const X = ...;` or `wf.edge(...);`
+        if (ts.isVariableStatement(stmt)) {
+            handleVariableStatement(stmt);
+            continue;
+        }
+        if (ts.isExpressionStatement(stmt)) {
+            handleExpressionStatement(stmt);
+            continue;
+        }
+        addError(
+            stmt,
+            `Only imports, \`const X = ...\` bindings, and \`wf.edge(...)\` calls are allowed at the top level. Found: ${ts.SyntaxKind[stmt.kind]}.`,
+        );
+    }
+
+    function handleVariableStatement(stmt: ts.VariableStatement): void {
+        const modifiers = ts.getModifiers(stmt);
+        if (modifiers && modifiers.some((m) => m.kind === ts.SyntaxKind.ExportKeyword)) {
+            addError(stmt, "`export` is not allowed on workflow bindings.");
+            return;
+        }
+        if ((stmt.declarationList.flags & ts.NodeFlags.Const) === 0) {
+            addError(stmt, "Use `const` for all bindings.");
+            return;
+        }
+        for (const decl of stmt.declarationList.declarations) {
+            if (!ts.isIdentifier(decl.name)) {
+                addError(decl, "Destructuring is not allowed — use a single identifier.");
+                continue;
+            }
+            if (!decl.initializer) {
+                addError(decl, "Bindings must have an initializer.");
+                continue;
+            }
+            const varName = decl.name.text;
+            handleBinding(varName, decl.initializer, decl);
+        }
+    }
+
+    function handleBinding(
+        varName: string,
+        initializer: ts.Expression,
+        origin: ts.Node,
+    ): void {
+        const expr = unwrapAwait(initializer);
+
+        // `const wf = new Workflow({ name: "..." })`
+        if (ts.isNewExpression(expr)) {
+            if (!ts.isIdentifier(expr.expression) || expr.expression.text !== "Workflow") {
+                addError(origin, "Only `new Workflow(...)` is supported for object construction.");
+                return;
+            }
+            if (workflowVar) {
+                addError(origin, `A Workflow is already bound (as \`${workflowVar}\`). Only one Workflow is allowed.`);
+                return;
+            }
+            const args = expr.arguments ?? ts.factory.createNodeArray();
+            if (args.length > 0) {
+                const val = literalToJs(args[0]!, addError);
+                if (
+                    val &&
+                    typeof val === "object" &&
+                    !Array.isArray(val) &&
+                    typeof (val as Record<string, unknown>)["name"] === "string"
+                ) {
+                    workflowName = (val as Record<string, unknown>)["name"] as string;
+                }
+            }
+            workflowVar = varName;
+            return;
+        }
+
+        // `const X = wf.addTyped(factory({...}))` or `wf.add({ type: "...", ... })`
+        if (ts.isCallExpression(expr)) {
+            const call = expr;
+            const callee = call.expression;
+
+            // Must be `wf.XYZ(...)` — property access off the workflow var
+            if (
+                !ts.isPropertyAccessExpression(callee) ||
+                !ts.isIdentifier(callee.expression) ||
+                (workflowVar !== null && callee.expression.text !== workflowVar)
+            ) {
+                addError(
+                    origin,
+                    `Expected \`${workflowVar ?? "wf"}.addTyped(...)\` or \`${workflowVar ?? "wf"}.add(...)\`.`,
+                );
+                return;
+            }
+            if (!workflowVar) {
+                addError(origin, "Workflow must be constructed before adding nodes.");
+                return;
+            }
+
+            const method = callee.name.text;
+            if (method === "addTyped") {
+                handleAddTyped(varName, call, origin);
+            } else if (method === "add") {
+                handleAddGeneric(varName, call, origin);
+            } else {
+                addError(
+                    origin,
+                    `Unsupported method \`${method}\`. Use \`addTyped\` or \`add\`.`,
+                );
+            }
+            return;
+        }
+
+        addError(
+            origin,
+            "Only `new Workflow(...)`, `wf.addTyped(...)`, and `wf.add(...)` are allowed as binding initializers.",
+        );
+    }
+
+    function handleAddTyped(
+        varName: string,
+        call: ts.CallExpression,
+        origin: ts.Node,
+    ): void {
+        if (call.arguments.length < 1 || call.arguments.length > 2) {
+            addError(origin, "`addTyped` takes 1 or 2 arguments.");
+            return;
+        }
+        const inner = call.arguments[0]!;
+        if (!ts.isCallExpression(inner) || !ts.isIdentifier(inner.expression)) {
+            addError(
+                origin,
+                "`addTyped` must be called with a factory invocation, e.g. `addTyped(startCall({ ... }))`.",
+            );
+            return;
+        }
+        const factoryName = inner.expression.text;
+        if (!specByName.has(factoryName)) {
+            addError(
+                origin,
+                `Unknown node type: \`${factoryName}\`. Check the list of registered node types.`,
+            );
+            return;
+        }
+        const factoryArgs = inner.arguments;
+        let data: Record<string, unknown> = {};
+        if (factoryArgs.length > 0) {
+            const parsed = literalToJs(factoryArgs[0]!, addError);
+            if (parsed !== undefined) {
+                if (typeof parsed !== "object" || parsed === null || Array.isArray(parsed)) {
+                    addError(inner, "Factory argument must be an object literal.");
+                    return;
+                }
+                data = parsed as Record<string, unknown>;
+            }
+        }
+        // Optional position arg
+        const position = extractPositionArg(call.arguments[1], addError);
+        bindNode(varName, factoryName, data, position, origin);
+    }
+
+    function handleAddGeneric(
+        varName: string,
+        call: ts.CallExpression,
+        origin: ts.Node,
+    ): void {
+        if (call.arguments.length !== 1) {
+            addError(origin, "`add` takes exactly 1 object argument.");
+            return;
+        }
+        const parsed = literalToJs(call.arguments[0]!, addError);
+        if (parsed === undefined) return;
+        if (typeof parsed !== "object" || parsed === null || Array.isArray(parsed)) {
+            addError(origin, "`add` argument must be an object literal.");
+            return;
+        }
+        const obj = parsed as Record<string, unknown>;
+        const typeValue = obj["type"];
+        if (typeof typeValue !== "string") {
+            addError(origin, "`add({ type, ... })` requires a string `type` field.");
+            return;
+        }
+        if (!specByName.has(typeValue)) {
+            addError(origin, `Unknown node type: \`${typeValue}\`.`);
+            return;
+        }
+        let position: { x: number; y: number } | undefined;
+        if (obj["position"] !== undefined) {
+            const p = obj["position"];
+            if (
+                Array.isArray(p) &&
+                p.length === 2 &&
+                typeof p[0] === "number" &&
+                typeof p[1] === "number"
+            ) {
+                position = { x: p[0], y: p[1] };
+            } else {
+                addError(
+                    origin,
+                    "`position` must be a [x, y] tuple of numbers.",
+                );
+                return;
+            }
+        }
+        const { type: _ignored, position: _ignored2, ...rest } = obj;
+        bindNode(varName, typeValue, rest, position, origin);
+    }
+
+    function bindNode(
+        varName: string,
+        type: string,
+        data: Record<string, unknown>,
+        position: { x: number; y: number } | undefined,
+        origin: ts.Node,
+    ): void {
+        if (nodeRefs.has(varName)) {
+            addError(origin, `Variable \`${varName}\` is already bound.`);
+            return;
+        }
+        const node: WireNode = {
+            id: String(nextId++),
+            type,
+            position: position ?? { x: 0, y: 0 },
+            data,
+        };
+        nodes.push(node);
+        nodeRefs.set(varName, node);
+    }
+
+    function handleExpressionStatement(stmt: ts.ExpressionStatement): void {
+        const expr = unwrapAwait(stmt.expression);
+        if (!ts.isCallExpression(expr)) {
+            addError(stmt, "Only `wf.edge(...)` calls are allowed as bare statements.");
+            return;
+        }
+        const callee = expr.expression;
+        if (
+            !ts.isPropertyAccessExpression(callee) ||
+            !ts.isIdentifier(callee.expression) ||
+            (workflowVar !== null && callee.expression.text !== workflowVar) ||
+            callee.name.text !== "edge"
+        ) {
+            addError(stmt, "Only `wf.edge(source, target, opts)` is allowed as a bare statement.");
+            return;
+        }
+        if (expr.arguments.length !== 3) {
+            addError(stmt, "`edge` takes exactly 3 arguments: (source, target, opts).");
+            return;
+        }
+        const [srcArg, tgtArg, optsArg] = expr.arguments;
+        if (!ts.isIdentifier(srcArg!) || !ts.isIdentifier(tgtArg!)) {
+            addError(stmt, "`edge` source and target must be variable identifiers bound by `addTyped`/`add`.");
+            return;
+        }
+        const src = nodeRefs.get(srcArg.text);
+        const tgt = nodeRefs.get(tgtArg.text);
+        if (!src) {
+            addError(srcArg, `Unknown node variable: \`${srcArg.text}\`.`);
+            return;
+        }
+        if (!tgt) {
+            addError(tgtArg, `Unknown node variable: \`${tgtArg.text}\`.`);
+            return;
+        }
+        const opts = literalToJs(optsArg!, addError);
+        if (opts === undefined) return;
+        if (typeof opts !== "object" || opts === null || Array.isArray(opts)) {
+            addError(stmt, "`edge` options must be an object literal.");
+            return;
+        }
+        const optsObj = opts as Record<string, unknown>;
+        if (typeof optsObj["label"] !== "string" || (optsObj["label"] as string).trim() === "") {
+            addError(stmt, "`edge` requires a non-empty `label` string.");
+            return;
+        }
+        if (typeof optsObj["condition"] !== "string" || (optsObj["condition"] as string).trim() === "") {
+            addError(stmt, "`edge` requires a non-empty `condition` string.");
+            return;
+        }
+        edges.push({
+            id: `${src.id}-${tgt.id}`,
+            source: src.id,
+            target: tgt.id,
+            data: optsObj,
+        });
+    }
+
+    // ── terminate early on parse errors ──────────────────────────────
+    if (errors.length > 0) {
+        return { ok: false, stage: "parse", errors };
+    }
+
+    if (!workflowVar) {
+        return {
+            ok: false,
+            stage: "parse",
+            errors: [
+                {
+                    message:
+                        "No Workflow construction found. Expected `const wf = new Workflow({ name: \"...\" });`.",
+                },
+            ],
+        };
+    }
+
+    // ── spec-driven node validation ─────────────────────────────────
+    const validationErrors: ParseErrorItem[] = [];
+    for (const node of nodes) {
+        const spec = specByName.get(node.type)!;
+        const validated = validateNodeData(
+            spec,
+            node.data,
+            (msg) => validationErrors.push({ message: `[${node.type}] ${msg}` }),
+        );
+        if (validated !== null) node.data = validated;
+    }
+    if (validationErrors.length > 0) {
+        return { ok: false, stage: "validate", errors: validationErrors };
+    }
+
+    return {
+        ok: true,
+        workflow: {
+            nodes,
+            edges,
+            viewport: { x: 0, y: 0, zoom: 1 },
+        },
+        workflowName,
+    };
+}
+
+// ─── helpers ──────────────────────────────────────────────────────────
+
+function unwrapAwait(expr: ts.Expression): ts.Expression {
+    return ts.isAwaitExpression(expr) ? expr.expression : expr;
+}
+
+function extractPositionArg(
+    arg: ts.Expression | undefined,
+    addError: (n: ts.Node, m: string) => void,
+): { x: number; y: number } | undefined {
+    if (!arg) return undefined;
+    const parsed = literalToJs(arg, addError);
+    if (parsed === undefined || parsed === null) return undefined;
+    if (
+        typeof parsed === "object" &&
+        !Array.isArray(parsed) &&
+        Array.isArray((parsed as Record<string, unknown>)["position"])
+    ) {
+        const p = (parsed as Record<string, unknown>)["position"] as unknown[];
+        if (p.length === 2 && typeof p[0] === "number" && typeof p[1] === "number") {
+            return { x: p[0], y: p[1] };
+        }
+    }
+    addError(arg, "Optional second arg must be `{ position: [x, y] }`.");
+    return undefined;
+}
+
+// Convert an expression to a plain JS value. Accepts: string, number,
+// boolean, null, undefined (→ undefined), array/object literals of the
+// same. Rejects any expression with runtime semantics (identifiers other
+// than `true/false/null/undefined`, function calls, arrow fns, etc.).
+function literalToJs(
+    expr: ts.Expression,
+    addError: (n: ts.Node, m: string) => void,
+): unknown {
+    if (ts.isStringLiteral(expr) || ts.isNoSubstitutionTemplateLiteral(expr)) {
+        return expr.text;
+    }
+    if (ts.isNumericLiteral(expr)) return Number(expr.text);
+    if (expr.kind === ts.SyntaxKind.TrueKeyword) return true;
+    if (expr.kind === ts.SyntaxKind.FalseKeyword) return false;
+    if (expr.kind === ts.SyntaxKind.NullKeyword) return null;
+    if (ts.isIdentifier(expr) && expr.text === "undefined") return undefined;
+    if (ts.isPrefixUnaryExpression(expr)) {
+        if (expr.operator === ts.SyntaxKind.MinusToken) {
+            const inner = literalToJs(expr.operand, addError);
+            if (typeof inner === "number") return -inner;
+        }
+        if (expr.operator === ts.SyntaxKind.PlusToken) {
+            const inner = literalToJs(expr.operand, addError);
+            if (typeof inner === "number") return inner;
+        }
+        addError(expr, "Unsupported unary operator; only numeric negation is allowed.");
+        return undefined;
+    }
+    if (ts.isArrayLiteralExpression(expr)) {
+        const out: unknown[] = [];
+        for (const el of expr.elements) {
+            if (el.kind === ts.SyntaxKind.OmittedExpression) {
+                addError(el, "Sparse arrays are not allowed.");
+                return undefined;
+            }
+            if (ts.isSpreadElement(el)) {
+                addError(el, "Spread elements are not allowed in array literals.");
+                return undefined;
+            }
+            const v = literalToJs(el, addError);
+            if (v === undefined && el.kind !== ts.SyntaxKind.Identifier) {
+                return undefined;
+            }
+            out.push(v);
+        }
+        return out;
+    }
+    if (ts.isObjectLiteralExpression(expr)) {
+        const out: Record<string, unknown> = {};
+        for (const prop of expr.properties) {
+            if (!ts.isPropertyAssignment(prop)) {
+                addError(prop, "Only plain `key: value` properties are allowed (no methods, shorthand, spread, or computed keys).");
+                return undefined;
+            }
+            let key: string;
+            if (ts.isIdentifier(prop.name) || ts.isStringLiteral(prop.name)) {
+                key = prop.name.text;
+            } else {
+                addError(prop.name, "Property keys must be identifiers or string literals.");
+                return undefined;
+            }
+            const val = literalToJs(prop.initializer, addError);
+            if (val === undefined && prop.initializer.kind !== ts.SyntaxKind.Identifier) {
+                // treat explicit `undefined` as omission
+                continue;
+            }
+            out[key] = val;
+        }
+        return out;
+    }
+    if (ts.isTemplateExpression(expr)) {
+        addError(expr, "Template literals with interpolation are not allowed — use plain strings.");
+        return undefined;
+    }
+    addError(expr, `Unsupported expression (${ts.SyntaxKind[expr.kind]}). Only literals are allowed in data positions.`);
+    return undefined;
+}
+
+// Spec-driven validation, mirrors the shape of
+// `sdk/python/src/dograh_sdk/_validation.py` but lightweight — applies
+// defaults for missing optionals, catches unknown keys, enforces `options`
+// membership, and type-shapes the scalar and `fixed_collection` cases.
+function validateNodeData(
+    spec: NodeSpec,
+    data: Record<string, unknown>,
+    addError: (message: string) => void,
+): Record<string, unknown> | null {
+    const out: Record<string, unknown> = {};
+    const known = new Map<string, PropertySpec>();
+    for (const p of spec.properties ?? []) known.set(p.name, p);
+
+    for (const key of Object.keys(data)) {
+        if (!known.has(key)) {
+            addError(`Unknown field: \`${key}\`.`);
+            return null;
+        }
+    }
+
+    for (const [key, prop] of known) {
+        if (key in data) {
+            out[key] = data[key];
+        } else if (prop.default !== undefined && prop.default !== null) {
+            out[key] = prop.default;
+        } else if (prop.required) {
+            addError(`Missing required field: \`${key}\`.`);
+            return null;
+        }
+    }
+
+    for (const [key, prop] of known) {
+        if (!(key in out)) continue;
+        const value = out[key];
+        const err = checkPropertyShape(prop, value);
+        if (err) {
+            addError(`Field \`${key}\`: ${err}`);
+            return null;
+        }
+    }
+
+    return out;
+}
+
+function checkPropertyShape(prop: PropertySpec, value: unknown): string | null {
+    switch (prop.type) {
+        case "string":
+        case "mention_textarea":
+        case "url":
+        case "recording_ref":
+        case "credential_ref":
+            if (typeof value !== "string") return `expected string, got ${jsTypeOf(value)}.`;
+            return null;
+        case "number":
+            if (typeof value !== "number") return `expected number, got ${jsTypeOf(value)}.`;
+            return null;
+        case "boolean":
+            if (typeof value !== "boolean") return `expected boolean, got ${jsTypeOf(value)}.`;
+            return null;
+        case "tool_refs":
+        case "document_refs":
+        case "multi_options":
+            if (!Array.isArray(value)) return `expected array, got ${jsTypeOf(value)}.`;
+            for (const el of value) {
+                if (prop.type === "multi_options") {
+                    if (!isInOptions(prop, el)) {
+                        return `value \`${JSON.stringify(el)}\` is not in the allowed options.`;
+                    }
+                } else if (typeof el !== "string") {
+                    return `array elements must be strings.`;
+                }
+            }
+            return null;
+        case "options":
+            if (!isInOptions(prop, value)) {
+                return `value \`${JSON.stringify(value)}\` is not in the allowed options.`;
+            }
+            return null;
+        case "json":
+            if (typeof value !== "object" || value === null || Array.isArray(value)) {
+                return `expected JSON object, got ${jsTypeOf(value)}.`;
+            }
+            return null;
+        case "fixed_collection":
+            if (!Array.isArray(value)) return `expected array of rows, got ${jsTypeOf(value)}.`;
+            for (let i = 0; i < value.length; i++) {
+                const row = value[i];
+                if (typeof row !== "object" || row === null || Array.isArray(row)) {
+                    return `row ${i}: expected object, got ${jsTypeOf(row)}.`;
+                }
+                for (const sub of prop.properties ?? []) {
+                    const subVal = (row as Record<string, unknown>)[sub.name];
+                    if (subVal === undefined) {
+                        if (sub.required && (sub.default === undefined || sub.default === null)) {
+                            return `row ${i}: missing required field \`${sub.name}\`.`;
+                        }
+                        continue;
+                    }
+                    const subErr = checkPropertyShape(sub, subVal);
+                    if (subErr) return `row ${i}, \`${sub.name}\`: ${subErr}`;
+                }
+            }
+            return null;
+        default:
+            return null; // Unknown types pass — forward compat.
+    }
+}
+
+function isInOptions(prop: PropertySpec, value: unknown): boolean {
+    if (!prop.options) return true;
+    return prop.options.some((o) => o.value === value);
+}
+
+function jsTypeOf(v: unknown): string {
+    if (v === null) return "null";
+    if (Array.isArray(v)) return "array";
+    return typeof v;
+}
--- a/api/mcp_server/ts_validator/src/types.ts
+++ b/api/mcp_server/ts_validator/src/types.ts
@ -0,0 +1,57 @@
+// Shared shapes used by both generate and parse. Mirror the `ReactFlowDTO`
+// wire format on the Python side (`api/services/workflow/dto.py`) and the
+// node-spec JSON served by `/api/v1/node-types` / dumped by
+// `python -m api.services.workflow.node_specs`.
+
+export interface PropertyOption {
+    value: string | number | boolean;
+    label: string;
+}
+
+export interface PropertySpec {
+    name: string;
+    type: string;
+    required?: boolean;
+    default?: unknown;
+    options?: PropertyOption[];
+    properties?: PropertySpec[];
+}
+
+export interface NodeSpec {
+    name: string;
+    properties: PropertySpec[];
+}
+
+export interface WireNode {
+    id: string;
+    type: string;
+    position: { x: number; y: number };
+    data: Record<string, unknown>;
+}
+
+export interface WireEdge {
+    id: string;
+    source: string;
+    target: string;
+    data: Record<string, unknown>;
+}
+
+export interface WireWorkflow {
+    nodes: WireNode[];
+    edges: WireEdge[];
+    viewport: { x: number; y: number; zoom: number };
+}
+
+export interface ParseErrorItem {
+    message: string;
+    line?: number;
+    column?: number;
+}
+
+export type GenerateResult =
+    | { ok: true; code: string }
+    | { ok: false; errors: ParseErrorItem[] };
+
+export type ParseResult =
+    | { ok: true; workflow: WireWorkflow; workflowName: string }
+    | { ok: false; stage: "parse" | "validate"; errors: ParseErrorItem[] };
--- a/api/mcp_server/ts_validator/tsconfig.json
+++ b/api/mcp_server/ts_validator/tsconfig.json
@ -0,0 +1,14 @@
+{
+    "compilerOptions": {
+        "target": "ES2022",
+        "module": "ESNext",
+        "moduleResolution": "bundler",
+        "strict": true,
+        "esModuleInterop": true,
+        "allowImportingTsExtensions": true,
+        "skipLibCheck": true,
+        "noEmit": true,
+        "isolatedModules": true
+    },
+    "include": ["src/**/*.ts"]
+}
--- a/api/pytest.ini
+++ b/api/pytest.ini
@ -6,7 +6,7 @@ testpaths = tests
 python_files = test_*.py *_test.py
 python_classes = Test*
 python_functions = test_*
-addopts = -v --tb=short -s
+addopts = -v --tb=short -s --import-mode=importlib
 markers =
    asyncio: mark test as an async test
    slow: mark test as slow running
--- a/api/requirements.dev.txt
+++ b/api/requirements.dev.txt
@ -4,4 +4,6 @@ pytest==8.3.5
 pytest-asyncio==0.26.0
 pre-commit==4.2.0
 watchfiles==1.1.0
-python-dotenv==1.2.1
+python-dotenv==1.2.1
+datamodel-code-generator==0.56.1
+-e ./sdk/python
--- a/api/requirements.txt
+++ b/api/requirements.txt
@ -13,10 +13,8 @@ python-multipart==0.0.20
 sentry-sdk[fastapi]==2.38.0
 sqlalchemy[asyncio]==2.0.43
 msgpack==1.1.2
-docling[rapidocr]==2.68.0
 pgvector==0.4.2
 bcrypt==5.0.0
 email-validator==2.3.0
 posthog==7.11.1
 fastmcp==3.2.4
-rank-bm25==0.2.2
--- a/api/routes/credentials.py
+++ b/api/routes/credentials.py
@ -9,6 +9,7 @@ from pydantic import BaseModel
 from api.db import db_client
 from api.db.models import UserModel
 from api.enums import WebhookCredentialType
+from api.sdk_expose import sdk_expose
 from api.services.auth.depends import get_user

 router = APIRouter(prefix="/credentials")
@ -107,7 +108,13 @@ def build_credential_response(credential) -> CredentialResponse:
    )


-@router.get("/")
+@router.get(
+    "/",
+    **sdk_expose(
+        method="list_credentials",
+        description="List webhook credentials available to the authenticated organization.",
+    ),
+)
 async def list_credentials(
    user: UserModel = Depends(get_user),
 ) -> List[CredentialResponse]:
--- a/api/routes/knowledge_base.py
+++ b/api/routes/knowledge_base.py
@ -17,6 +17,7 @@ from api.schemas.knowledge_base import (
    DocumentUploadResponseSchema,
    ProcessDocumentRequestSchema,
 )
+from api.sdk_expose import sdk_expose
 from api.services.auth.depends import get_user
 from api.services.posthog_client import capture_event
 from api.services.storage import storage_fs
@ -135,6 +136,7 @@ async def process_document(
            document.id,
            request.s3_key,
            user.selected_organization_id,
+            str(user.provider_id),
            128,  # max_tokens (default)
            request.retrieval_mode,
        )
@ -190,6 +192,10 @@ async def process_document(
    "/documents",
    response_model=DocumentListResponseSchema,
    summary="List documents",
+    **sdk_expose(
+        method="list_documents",
+        description="List knowledge base documents available to the authenticated organization.",
+    ),
 )
 async def list_documents(
    status: Annotated[
--- a/api/routes/main.py
+++ b/api/routes/main.py
@ -8,6 +8,7 @@ from api.routes.credentials import router as credentials_router
 from api.routes.integration import router as integration_router
 from api.routes.knowledge_base import router as knowledge_base_router
 from api.routes.looptalk import router as looptalk_router
+from api.routes.node_types import router as node_types_router
 from api.routes.organization import router as organization_router
 from api.routes.organization_usage import router as organization_usage_router
 from api.routes.public_agent import router as public_agent_router
@ -54,6 +55,7 @@ router.include_router(workflow_embed_router)
 router.include_router(knowledge_base_router)
 router.include_router(workflow_recording_router)
 router.include_router(auth_router)
+router.include_router(node_types_router)


 class HealthResponse(BaseModel):
--- a/api/routes/node_types.py
+++ b/api/routes/node_types.py
@ -0,0 +1,67 @@
+"""API for the node-spec catalog.
+
+Exposes the registered NodeSpecs (one per node type) so frontend renderers
+and the LLM SDK can build forms / typed constructors from a single source
+of truth.
+
+Endpoints:
+    GET /node-types          → list every registered NodeSpec
+    GET /node-types/{name}   → single NodeSpec by name
+"""
+
+from fastapi import APIRouter, Depends, HTTPException
+from pydantic import BaseModel
+
+from api.db.models import UserModel
+from api.sdk_expose import sdk_expose
+from api.services.auth.depends import get_user
+from api.services.workflow.node_specs import (
+    SPEC_VERSION,
+    NodeSpec,
+    all_specs,
+    get_spec,
+)
+
+router = APIRouter(prefix="/node-types")
+
+
+class NodeTypesResponse(BaseModel):
+    spec_version: str
+    node_types: list[NodeSpec]
+
+
+@router.get(
+    "",
+    response_model=NodeTypesResponse,
+    **sdk_expose(
+        method="list_node_types",
+        description="List every registered node type with its spec. Pinned to spec_version.",
+    ),
+)
+async def list_node_types(
+    _user: UserModel = Depends(get_user),
+) -> NodeTypesResponse:
+    """List every registered NodeSpec.
+
+    SDK clients should pin to `spec_version` and warn if the server reports
+    a higher version than what they were generated against.
+    """
+    return NodeTypesResponse(spec_version=SPEC_VERSION, node_types=all_specs())
+
+
+@router.get(
+    "/{name}",
+    response_model=NodeSpec,
+    **sdk_expose(
+        method="get_node_type",
+        description="Fetch a single node spec by name.",
+    ),
+)
+async def get_node_type(
+    name: str,
+    _user: UserModel = Depends(get_user),
+) -> NodeSpec:
+    spec = get_spec(name)
+    if spec is None:
+        raise HTTPException(status_code=404, detail=f"Unknown node type: {name!r}")
+    return spec
--- a/api/routes/telephony.py
+++ b/api/routes/telephony.py
@ -29,6 +29,7 @@ from api.db.workflow_client import WorkflowClient
 from api.db.workflow_run_client import WorkflowRunClient
 from api.enums import CallType, OrganizationConfigurationKey, WorkflowRunState
 from api.errors.telephony_errors import TelephonyError
+from api.sdk_expose import sdk_expose
 from api.services.auth.depends import get_user
 from api.services.campaign.campaign_call_dispatcher import campaign_call_dispatcher
 from api.services.campaign.campaign_event_publisher import get_campaign_event_publisher
@ -139,7 +140,13 @@ class StatusCallbackRequest(BaseModel):
        )


-@router.post("/initiate-call")
+@router.post(
+    "/initiate-call",
+    **sdk_expose(
+        method="test_phone_call",
+        description="Place a test call from a workflow to a phone number.",
+    ),
+)
 async def initiate_call(
    request: InitiateCallRequest, user: UserModel = Depends(get_user)
 ):
--- a/api/routes/tool.py
+++ b/api/routes/tool.py
@ -10,6 +10,7 @@ from pydantic import BaseModel, Field, field_validator
 from api.db import db_client
 from api.db.models import UserModel
 from api.enums import PostHogEvent, ToolCategory, ToolStatus
+from api.sdk_expose import sdk_expose
 from api.services.auth.depends import get_user
 from api.services.posthog_client import capture_event

@ -276,7 +277,13 @@ def validate_status(status: str) -> None:
            )


-@router.get("/")
+@router.get(
+    "/",
+    **sdk_expose(
+        method="list_tools",
+        description="List tools available to the authenticated organization.",
+    ),
+)
 async def list_tools(
    status: Optional[str] = None,
    category: Optional[str] = None,
--- a/api/routes/workflow.py
+++ b/api/routes/workflow.py
@ -16,6 +16,7 @@ from api.db.models import UserModel
 from api.db.workflow_template_client import WorkflowTemplateClient
 from api.enums import CallType, PostHogEvent, StorageBackend
 from api.schemas.workflow import WorkflowRunResponseSchema
+from api.sdk_expose import sdk_expose
 from api.services.auth.depends import get_user
 from api.services.campaign.report import generate_workflow_report_csv
 from api.services.configuration.check_validity import UserConfigurationValidator
@ -27,7 +28,7 @@ from api.services.configuration.resolve import resolve_effective_config
 from api.services.mps_service_key_client import mps_service_key_client
 from api.services.posthog_client import capture_event
 from api.services.storage import storage_fs
-from api.services.workflow.dto import ReactFlowDTO
+from api.services.workflow.dto import ReactFlowDTO, sanitize_workflow_definition
 from api.services.workflow.duplicate import duplicate_workflow
 from api.services.workflow.errors import ItemKind, WorkflowError
 from api.services.workflow.workflow import WorkflowGraph
@ -453,7 +454,13 @@ async def get_workflow_count(
    )


-@router.get("/fetch")
+@router.get(
+    "/fetch",
+    **sdk_expose(
+        method="list_workflows",
+        description="List all workflows in the authenticated organization.",
+    ),
+)
 async def get_workflows(
    user: UserModel = Depends(get_user),
    status: Optional[str] = Query(
@ -499,7 +506,13 @@ async def get_workflows(
    ]


-@router.get("/fetch/{workflow_id}")
+@router.get(
+    "/fetch/{workflow_id}",
+    **sdk_expose(
+        method="get_workflow",
+        description="Get a single workflow by ID (returns draft if one exists, else published).",
+    ),
+)
 async def get_workflow(
    workflow_id: int,
    user: UserModel = Depends(get_user),
@ -701,7 +714,13 @@ async def update_workflow_status(
        raise HTTPException(status_code=500, detail=str(e))


-@router.put("/{workflow_id}")
+@router.put(
+    "/{workflow_id}",
+    **sdk_expose(
+        method="update_workflow",
+        description="Update a workflow's name and/or definition. Saves as a new draft.",
+    ),
+)
 async def update_workflow(
    workflow_id: int,
    request: UpdateWorkflowRequest,
@ -721,8 +740,10 @@ async def update_workflow(
        HTTPException: If the workflow is not found or if there's a database error
    """
    try:
-        # Restore real API keys where the incoming definition has masked placeholders
-        workflow_definition = request.workflow_definition
+        # Strip UI runtime-only fields (invalid, validationMessage, etc.) from
+        # node.data / edge.data before anything touches the DB — the UI sends
+        # nodes wholesale from the React Flow store, which carries those.
+        workflow_definition = sanitize_workflow_definition(request.workflow_definition)
        if workflow_definition:
            existing_workflow = await db_client.get_workflow(
                workflow_id, organization_id=user.selected_organization_id
--- a/api/routes/workflow_recording.py
+++ b/api/routes/workflow_recording.py
@ -19,6 +19,7 @@ from api.schemas.workflow_recording import (
    RecordingUpdateRequestSchema,
    RecordingUploadResponseSchema,
 )
+from api.sdk_expose import sdk_expose
 from api.services.auth.depends import get_user
 from api.services.mps_service_key_client import mps_service_key_client
 from api.services.storage import storage_fs
@ -165,6 +166,10 @@ async def create_recordings(
    "/",
    response_model=RecordingListResponseSchema,
    summary="List recordings",
+    **sdk_expose(
+        method="list_recordings",
+        description="List workflow recordings available to the authenticated organization.",
+    ),
 )
 async def list_recordings(
    workflow_id: Annotated[
--- a/api/sdk_expose.py
+++ b/api/sdk_expose.py
@ -0,0 +1,38 @@
+"""Opt-in marker for exposing a FastAPI route through the Dograh SDK.
+
+The generated SDK client (`sdk/python/src/dograh_sdk/_generated_client.py`
+and the TypeScript equivalent) is built by walking the backend's OpenAPI
+schema and picking up any operation tagged with `x-sdk-method`. That
+means `generate_sdk.sh` stays in sync with the real HTTP paths — no more
+hand-typed URL strings drifting out of date.
+
+Usage:
+
+    from api.sdk_expose import sdk_expose
+
+    @router.post("/initiate-call", **sdk_expose(
+        method="test_phone_call",
+        description="Place a test call from a workflow to a phone number.",
+    ))
+    async def initiate_call(...): ...
+
+Anything not wrapped in `sdk_expose` is invisible to the SDK — deliberate,
+so the SDK surface stays small and auditable.
+"""
+
+from __future__ import annotations
+
+from typing import Any
+
+
+def sdk_expose(*, method: str, description: str = "") -> dict[str, Any]:
+    """Return FastAPI route kwargs that tag the operation for SDK codegen.
+
+    `method` becomes the SDK method name in both Python and TypeScript
+    (converted to snake_case / camelCase as appropriate by the codegen).
+    `description` is emitted as the method docstring.
+    """
+    extra: dict[str, Any] = {"x-sdk-method": method}
+    if description:
+        extra["x-sdk-description"] = description
+    return {"openapi_extra": extra}
--- a/api/services/gen_ai/embedding/openai_service.py
+++ b/api/services/gen_ai/embedding/openai_service.py
@ -1,35 +1,22 @@
 """OpenAI embedding service.

-This module provides document processing capabilities using:
- OpenAI's text-embedding-3-small for embeddings (1536 dimensions)
- Docling for document conversion and chunking
- pgvector for vector similarity search
+Embeds text and performs vector similarity search via the local database.
+Document conversion and chunking now live in the Model Proxy Service (MPS);
+this file no longer pulls docling/transformers.
 """

-import os
-from pathlib import Path
 from typing import Any, Dict, List, Optional

-from docling.chunking import HybridChunker
-from docling.document_converter import DocumentConverter
-from docling_core.transforms.chunker.tokenizer.huggingface import HuggingFaceTokenizer
 from loguru import logger
 from openai import AsyncOpenAI
-from transformers import AutoTokenizer

 from api.db.db_client import DBClient
-from api.db.models import KnowledgeBaseChunkModel

 from .base import BaseEmbeddingService

-# Model configuration
 DEFAULT_MODEL_ID = "text-embedding-3-small"
 EMBEDDING_DIMENSION = 1536  # Dimension for text-embedding-3-small

-# For chunking, we'll use the same tokenizer as SentenceTransformer
-# since OpenAI uses similar tokenization
-TOKENIZER_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
-

 class EmbeddingAPIKeyNotConfiguredError(Exception):
    """Raised when OpenAI API key is not configured for embeddings."""
@ -49,24 +36,20 @@ class OpenAIEmbeddingService(BaseEmbeddingService):
        db_client: DBClient,
        api_key: Optional[str] = None,
        model_id: str = DEFAULT_MODEL_ID,
-        max_tokens: int = 512,
        base_url: Optional[str] = None,
    ):
        """Initialize the OpenAI embedding service.

        Args:
-            db_client: Database client for storing documents and chunks
+            db_client: Database client for vector similarity search.
            api_key: OpenAI API key. If not provided, the client will not be
-                    initialized and operations will fail with a clear error.
-            model_id: OpenAI embedding model ID (default: text-embedding-3-small)
-            max_tokens: Maximum number of tokens per chunk (default: 512)
-            base_url: Optional base URL for the API (e.g. for OpenRouter)
+                initialized and operations will fail with a clear error.
+            model_id: OpenAI embedding model ID (default: text-embedding-3-small).
+            base_url: Optional base URL for the API (e.g. for OpenRouter).
        """
        self.db = db_client
        self.model_id = model_id
-        self.max_tokens = max_tokens

-        # Only initialize OpenAI client if API key is provided
        self._api_key_configured = bool(api_key)
        if self._api_key_configured:
            client_kwargs = {"api_key": api_key}
@ -81,35 +64,6 @@ class OpenAIEmbeddingService(BaseEmbeddingService):
                "Operations will fail until API key is configured in Model Configurations."
            )

-        # Initialize tokenizer for chunking
-        # We use a HuggingFace tokenizer for consistent chunking
-        logger.info(
-            f"Loading tokenizer for chunking: {TOKENIZER_MODEL} with max_tokens={max_tokens}"
-        )
-        try:
-            self.tokenizer = HuggingFaceTokenizer(
-                tokenizer=AutoTokenizer.from_pretrained(
-                    TOKENIZER_MODEL,
-                    local_files_only=True,
-                ),
-                max_tokens=max_tokens,
-            )
-            logger.info("Loaded tokenizer from cache")
-        except Exception as e:
-            logger.warning(f"Tokenizer not in cache, downloading: {e}")
-            self.tokenizer = HuggingFaceTokenizer(
-                tokenizer=AutoTokenizer.from_pretrained(TOKENIZER_MODEL),
-                max_tokens=max_tokens,
-            )
-            logger.info("Tokenizer downloaded and cached")
-
-        # Initialize chunker
-        logger.info(f"Initializing HybridChunker with max_tokens={max_tokens}")
-        self.chunker = HybridChunker(tokenizer=self.tokenizer)
-
-        # Initialize document converter
-        self.converter = DocumentConverter()
-
    def get_model_id(self) -> str:
        """Return the model identifier."""
        return self.model_id
@ -126,28 +80,17 @@ class OpenAIEmbeddingService(BaseEmbeddingService):
    async def embed_texts(self, texts: List[str]) -> List[List[float]]:
        """Embed a batch of texts using OpenAI API.

-        Args:
-            texts: List of text strings to embed
-
-        Returns:
-            List of embedding vectors (each vector is a list of floats)
-
        Raises:
-            EmbeddingAPIKeyNotConfiguredError: If API key is not configured
+            EmbeddingAPIKeyNotConfiguredError: If API key is not configured.
        """
        self._ensure_api_key_configured()

        try:
-            # OpenAI API call
            response = await self.client.embeddings.create(
                input=texts,
                model=self.model_id,
            )
-
-            # Extract embeddings from response
-            embeddings = [item.embedding for item in response.data]
-            return embeddings
-
+            return [item.embedding for item in response.data]
        except Exception as e:
            logger.error(f"Error generating OpenAI embeddings: {e}")
            raise
@ -155,14 +98,8 @@ class OpenAIEmbeddingService(BaseEmbeddingService):
    async def embed_query(self, query: str) -> List[float]:
        """Embed a single query text using OpenAI API.

-        Args:
-            query: Query text to embed
-
-        Returns:
-            Embedding vector as list of floats
-
        Raises:
-            EmbeddingAPIKeyNotConfiguredError: If API key is not configured
+            EmbeddingAPIKeyNotConfiguredError: If API key is not configured.
        """
        self._ensure_api_key_configured()
        embeddings = await self.embed_texts([query])
@ -177,201 +114,17 @@ class OpenAIEmbeddingService(BaseEmbeddingService):
    ) -> List[Dict[str, Any]]:
        """Search for similar chunks using vector similarity.

-        Args:
-            query: Search query text
-            organization_id: Organization ID for scoping
-            limit: Maximum number of results to return
-            document_uuids: Optional list of document UUIDs to filter by
-
-        Returns:
-            List of dictionaries with chunk data and similarity scores
-
        Raises:
-            EmbeddingAPIKeyNotConfiguredError: If API key is not configured
+            EmbeddingAPIKeyNotConfiguredError: If API key is not configured.
        """
        self._ensure_api_key_configured()

-        # Generate query embedding
        query_embedding = await self.embed_query(query)

-        # Perform vector similarity search
-        results = await self.db.search_similar_chunks(
+        return await self.db.search_similar_chunks(
            query_embedding=query_embedding,
            organization_id=organization_id,
            limit=limit,
            document_uuids=document_uuids,
            embedding_model=self.model_id,
        )
-
-        return results
-
-    async def process_document(
-        self,
-        file_path: str,
-        organization_id: int,
-        created_by: int,
-        custom_metadata: dict = None,
-    ):
-        """Process a document: convert, chunk, embed, and store in database.
-
-        Args:
-            file_path: Path to the document file
-            organization_id: Organization ID for scoping
-            created_by: User ID who uploaded the document
-            custom_metadata: Optional custom metadata dictionary
-
-        Returns:
-            The created document record
-        """
-        try:
-            # Extract file metadata
-            filename = Path(file_path).name
-            file_hash = self.db.compute_file_hash(file_path)
-            file_size = os.path.getsize(file_path)
-            mime_type = self.db.get_mime_type(file_path)
-
-            # Check if document already exists
-            existing_doc = await self.db.get_document_by_hash(
-                file_hash, organization_id
-            )
-            if existing_doc:
-                logger.info(f"Document already exists: {filename} (hash: {file_hash})")
-                return existing_doc
-
-            # Create document record
-            doc_record = await self.db.create_document(
-                organization_id=organization_id,
-                created_by=created_by,
-                filename=filename,
-                file_size_bytes=file_size,
-                file_hash=file_hash,
-                mime_type=mime_type,
-                custom_metadata=custom_metadata or {},
-            )
-
-            logger.info(f"Processing document with OpenAI embeddings: {filename}")
-
-            # Update status to processing
-            await self.db.update_document_status(doc_record.id, "processing")
-
-            # Step 1: Convert document using docling
-            logger.info("Converting document with docling...")
-            conversion_result = self.converter.convert(file_path)
-            doc = conversion_result.document
-
-            # Store docling metadata
-            docling_metadata = {
-                "num_pages": len(doc.pages) if hasattr(doc, "pages") else None,
-                "document_type": type(doc).__name__,
-            }
-
-            # Step 2: Chunk the document
-            logger.info(f"Chunking document with max_tokens={self.max_tokens}...")
-            chunks = list(self.chunker.chunk(dl_doc=doc))
-            total_chunks = len(chunks)
-
-            logger.info(f"Generated {total_chunks} chunks")
-
-            # Step 3: Process each chunk
-            chunk_texts = []
-            chunk_records = []
-            token_counts = []
-
-            for i, chunk in enumerate(chunks):
-                # Get chunk text
-                chunk_text = chunk.text
-
-                # Get contextualized text
-                contextualized_text = self.chunker.contextualize(chunk=chunk)
-
-                # Calculate token count
-                text_to_tokenize = (
-                    contextualized_text if contextualized_text else chunk_text
-                )
-                token_count = len(
-                    self.tokenizer.tokenizer.encode(
-                        text_to_tokenize, add_special_tokens=False
-                    )
-                )
-                token_counts.append(token_count)
-
-                # Prepare chunk metadata
-                chunk_metadata = {}
-                if hasattr(chunk, "meta") and chunk.meta:
-                    chunk_metadata = {
-                        "doc_items": (
-                            [str(item) for item in chunk.meta.doc_items]
-                            if hasattr(chunk.meta, "doc_items")
-                            else []
-                        ),
-                        "headings": (
-                            chunk.meta.headings
-                            if hasattr(chunk.meta, "headings")
-                            else []
-                        ),
-                    }
-
-                # Create chunk record (without embedding yet)
-                chunk_record = KnowledgeBaseChunkModel(
-                    document_id=doc_record.id,
-                    organization_id=organization_id,
-                    chunk_text=chunk_text,
-                    contextualized_text=contextualized_text,
-                    chunk_index=i,
-                    chunk_metadata=chunk_metadata,
-                    embedding_model=self.model_id,
-                    embedding_dimension=EMBEDDING_DIMENSION,
-                    token_count=token_count,
-                )
-
-                chunk_records.append(chunk_record)
-                chunk_texts.append(text_to_tokenize)
-
-            # Log chunk statistics
-            if token_counts:
-                avg_tokens = sum(token_counts) / len(token_counts)
-                min_tokens = min(token_counts)
-                max_tokens = max(token_counts)
-                logger.info("Chunk token statistics:")
-                logger.info(f"  - Average: {avg_tokens:.1f} tokens")
-                logger.info(f"  - Min: {min_tokens} tokens")
-                logger.info(f"  - Max: {max_tokens} tokens")
-
-            # Step 4: Generate embeddings using OpenAI API
-            logger.info(f"Generating embeddings using OpenAI ({self.model_id})...")
-            embeddings = await self.embed_texts(chunk_texts)
-
-            # Step 5: Attach embeddings to chunk records
-            for chunk_record, embedding in zip(chunk_records, embeddings):
-                chunk_record.embedding = embedding
-
-            # Step 6: Save all chunks in batch
-            logger.info("Storing chunks in database...")
-            await self.db.create_chunks_batch(chunk_records)
-
-            # Update document status to completed
-            await self.db.update_document_status(
-                doc_record.id,
-                "completed",
-                total_chunks=total_chunks,
-                docling_metadata=docling_metadata,
-            )
-
-            logger.info(f"Successfully processed document: {filename}")
-            logger.info(f"  - Total chunks: {total_chunks}")
-            logger.info(f"  - Embedding model: {self.model_id}")
-            logger.info(f"  - Document ID: {doc_record.id}")
-            logger.info(f"  - Document UUID: {doc_record.document_uuid}")
-
-            return doc_record
-
-        except Exception as e:
-            logger.error(f"Error processing document with OpenAI: {e}")
-
-            # Update document status to failed if it exists
-            if "doc_record" in locals():
-                await self.db.update_document_status(
-                    doc_record.id, "failed", error_message=str(e)
-                )
-
-            raise
--- a/api/services/mps_service_key_client.py
+++ b/api/services/mps_service_key_client.py
@ -487,6 +487,71 @@ class MPSServiceKeyClient:
                    response=response,
                )

+    async def process_document(
+        self,
+        file_path: str,
+        filename: str,
+        content_type: str,
+        retrieval_mode: str = "chunked",
+        max_tokens: int = 128,
+        chunk_overlap_tokens: int = 0,
+        merge_peers: bool = True,
+        tokenizer_model: Optional[str] = None,
+        correlation_id: Optional[str] = None,
+        organization_id: Optional[int] = None,
+        created_by: Optional[str] = None,
+    ) -> dict:
+        """Convert + chunk a document via MPS /document/process.
+
+        Returns a dict matching DocumentProcessResponse in MPS:
+            {
+              "mode": "chunked" | "full_document",
+              "docling_metadata": {...},
+              "full_text": str | None,   # populated only in full_document mode
+              "chunks": [...],           # populated only in chunked mode
+            }
+
+        Timeout is 300s to match the ALB idle_timeout configured in
+        infrastructure/mps/main.tf. Raises on non-2xx responses.
+        """
+        data = {
+            "retrieval_mode": retrieval_mode,
+            "max_tokens": str(max_tokens),
+            "chunk_overlap_tokens": str(chunk_overlap_tokens),
+            "merge_peers": str(merge_peers).lower(),
+        }
+        if tokenizer_model is not None:
+            data["tokenizer_model"] = tokenizer_model
+        if correlation_id:
+            data["correlation_id"] = correlation_id
+
+        headers = self._get_headers(organization_id, created_by)
+        # Remove JSON content-type so httpx sets the correct multipart boundary.
+        headers.pop("Content-Type", None)
+
+        async with httpx.AsyncClient(timeout=httpx.Timeout(300.0)) as client:
+            with open(file_path, "rb") as fh:
+                files = {"file": (filename, fh.read(), content_type)}
+
+            response = await client.post(
+                f"{self.base_url}/api/v1/document/process",
+                files=files,
+                data=data,
+                headers=headers,
+            )
+
+            if response.status_code == 200:
+                return response.json()
+
+            logger.error(
+                f"Failed to process document: {response.status_code} - {response.text}"
+            )
+            raise httpx.HTTPStatusError(
+                f"Failed to process document: {response.text}",
+                request=response.request,
+                response=response,
+            )
+
    async def call_workflow_api(
        self,
        call_type: str,
--- a/api/services/pipecat/audio_playback.py
+++ b/api/services/pipecat/audio_playback.py
@ -97,6 +97,7 @@ async def play_audio(
    queue_frame: Callable[[Frame], Awaitable[None]],
    transcript: Optional[str] = None,
    append_to_context: bool = False,
+    persist_to_logs: bool = False,
 ) -> None:
    """Play raw PCM-16 audio once.

@ -115,6 +116,8 @@ async def play_audio(
        transcript: Optional transcript of the recording.
        append_to_context: Whether the transcript should be appended to
            the LLM assistant context.  Defaults to False.
+        persist_to_logs: Whether the transcript should be written to the
+            app-level logs buffer by observers. Defaults to False.
    """
    context_id = str(uuid.uuid4())
    await queue_frame(TTSStartedFrame(context_id=context_id))
@ -123,6 +126,7 @@ async def play_audio(
            text=transcript, aggregated_by="recording", context_id=context_id
        )
        tts_text.append_to_context = append_to_context
+        tts_text.persist_to_logs = persist_to_logs
        await queue_frame(tts_text)
    await queue_frame(
        TTSAudioRawFrame(
--- a/api/services/pipecat/realtime_feedback_observer.py
+++ b/api/services/pipecat/realtime_feedback_observer.py
@ -42,6 +42,7 @@ from pipecat.frames.frames import (
    MetricsFrame,
    StopFrame,
    TranscriptionFrame,
+    TTSSpeakFrame,
    TTSTextFrame,
    UserMuteStartedFrame,
    UserMuteStoppedFrame,
@ -230,8 +231,22 @@ class RealtimeFeedbackObserver(BaseObserver):
                    },
                }
            )
+        # Handle engine-queued speech (transition/tool messages) marked for
+        # log persistence. The downstream TTSTextFrame(s) from the TTS service
+        # still stream to WS as normal; we persist the full utterance once here
+        # to avoid word-level log entries from word-timestamp providers.
+        elif isinstance(frame, TTSSpeakFrame):
+            if getattr(frame, "persist_to_logs", False):
+                await self._append_to_buffer(
+                    {
+                        "type": RealtimeFeedbackType.BOT_TEXT.value,
+                        "payload": {"text": frame.text},
+                    }
+                )
        # Handle bot TTS text - respect pts timing, WebSocket only
-        # Complete turn text is persisted via register_turn_handlers
+        # Complete turn text is persisted via register_turn_handlers,
+        # except for frames explicitly flagged persist_to_logs (e.g. recording
+        # transcripts from play_audio) which bypass the aggregator path.
        elif isinstance(frame, TTSTextFrame):
            message = {
                "type": RealtimeFeedbackType.BOT_TEXT.value,
@ -249,6 +264,9 @@ class RealtimeFeedbackObserver(BaseObserver):

                await self._ensure_clock_task()
                await self._clock_queue.put((frame.pts, frame.id, message))
+            elif getattr(frame, "persist_to_logs", False):
+                # No pts + explicit persistence request (recording transcript).
+                await self._send_message(message)
            else:
                # No pts, send immediately
                await self._send_ws(message)
--- a/api/services/pipecat/tracing_config.py
+++ b/api/services/pipecat/tracing_config.py
@ -94,6 +94,14 @@ class _OrgRoutingExporter(SpanExporter):
        org_buckets = {}

        for span in spans:
+            # Drop fastmcp's built-in auto-instrumentation spans
+            # (`tools/call <name>`, etc.) — our `@traced_tool` decorator
+            # in `api/mcp_server/tracing.py` produces the spans we want. Keeping
+            # both would just double every trace.
+            scope = getattr(span, "instrumentation_scope", None)
+            if scope is not None and scope.name == "fastmcp":
+                continue
+
            org_id = span.attributes.get("dograh.org_id") if span.attributes else None
            if org_id and str(org_id) in self._org_exporters:
                org_buckets.setdefault(str(org_id), []).append(span)
--- a/api/services/workflow/dto.py
+++ b/api/services/workflow/dto.py
@ -1,5 +1,5 @@
 from enum import Enum
-from typing import List, Optional
+from typing import Annotated, List, Literal, Optional, Union

 from pydantic import BaseModel, Field, ValidationError, model_validator

@ -42,17 +42,48 @@ class RetryConfigDTO(BaseModel):
    retry_delay_seconds: int = 5


-class NodeDataDTO(BaseModel):
+# ─────────────────────────────────────────────────────────────────────────
+# Per-type node data classes.
+#
+# Shared fields are factored out as Pydantic mixins; per-type classes
+# inherit only the mixins they need so mistyped fields raise at validation
+# time and downstream consumers get accurate types. `is_start` / `is_end`
+# live on every variant so the WorkflowGraph can identify boundary nodes
+# without dispatching on type.
+# ─────────────────────────────────────────────────────────────────────────
+
+
+class _NodeDataBase(BaseModel):
    name: str = Field(..., min_length=1)
-    prompt: Optional[str] = Field(default=None)
-    is_static: bool = False
    is_start: bool = False
    is_end: bool = False
+
+
+class _PromptedNodeDataMixin(BaseModel):
+    prompt: Optional[str] = Field(default=None)
+    is_static: bool = False
    allow_interrupt: bool = False
+    add_global_prompt: bool = True
+
+
+class _ExtractionNodeDataMixin(BaseModel):
    extraction_enabled: bool = False
    extraction_prompt: Optional[str] = None
    extraction_variables: Optional[list[ExtractionVariableDTO]] = None
-    add_global_prompt: bool = True
+
+
+class _ToolDocumentRefsMixin(BaseModel):
+    tool_uuids: Optional[List[str]] = None
+    document_uuids: Optional[List[str]] = None
+
+
+class StartCallNodeData(
+    _NodeDataBase,
+    _PromptedNodeDataMixin,
+    _ExtractionNodeDataMixin,
+    _ToolDocumentRefsMixin,
+):
+    is_start: bool = True
    greeting: Optional[str] = None
    greeting_type: Optional[str] = None  # 'text' or 'audio'
    greeting_recording_id: Optional[str] = None
@ -61,14 +92,38 @@ class NodeDataDTO(BaseModel):
    detect_voicemail: bool = False
    delayed_start: bool = False
    delayed_start_duration: Optional[float] = None
-    # Pre-call fetch (start node only)
    pre_call_fetch_enabled: bool = False
    pre_call_fetch_url: Optional[str] = None
    pre_call_fetch_credential_uuid: Optional[str] = None
-    tool_uuids: Optional[List[str]] = None
-    document_uuids: Optional[List[str]] = None
+
+
+class AgentNodeData(
+    _NodeDataBase,
+    _PromptedNodeDataMixin,
+    _ExtractionNodeDataMixin,
+    _ToolDocumentRefsMixin,
+):
+    pass
+
+
+class EndCallNodeData(
+    _NodeDataBase,
+    _PromptedNodeDataMixin,
+    _ExtractionNodeDataMixin,
+):
+    is_end: bool = True
+
+
+class GlobalNodeData(_NodeDataBase, _PromptedNodeDataMixin):
+    pass
+
+
+class TriggerNodeData(_NodeDataBase):
    trigger_path: Optional[str] = None
-    # Webhook node specific fields
+    enabled: bool = True
+
+
+class WebhookNodeData(_NodeDataBase):
    enabled: bool = True
    http_method: Optional[str] = None
    endpoint_url: Optional[str] = None
@ -76,30 +131,129 @@ class NodeDataDTO(BaseModel):
    custom_headers: Optional[list[CustomHeaderDTO]] = None
    payload_template: Optional[dict] = None
    retry_config: Optional[RetryConfigDTO] = None
-    # QA node specific fields
+
+
+class QANodeData(_NodeDataBase):
    qa_enabled: bool = True
-    qa_system_prompt: Optional[str] = None
+    qa_use_workflow_llm: bool = True
+    qa_provider: Optional[str] = None
    qa_model: Optional[str] = None
+    qa_api_key: Optional[str] = None
+    qa_endpoint: Optional[str] = None
+    qa_system_prompt: Optional[str] = None
    qa_min_call_duration: int = 15
    qa_voicemail_calls: bool = False
    qa_sample_rate: int = 100


-class RFNodeDTO(BaseModel):
+# Union of every per-type data class — useful as a type annotation on
+# consumers that handle any node data without dispatching on type. Cannot
+# be called as a constructor; use the per-type class directly.
+NodeDataDTO = Union[
+    StartCallNodeData,
+    AgentNodeData,
+    EndCallNodeData,
+    GlobalNodeData,
+    TriggerNodeData,
+    WebhookNodeData,
+    QANodeData,
+]
+
+
+# ─────────────────────────────────────────────────────────────────────────
+# Per-type RF nodes.
+#
+# RFNodeDTO is a discriminated Union over `type`. Pydantic dispatches to
+# the right variant when validating wire JSON. Direct instantiation must
+# use the concrete per-type class (StartCallRFNode, AgentRFNode, ...).
+# ─────────────────────────────────────────────────────────────────────────
+
+
+class _RFNodeBase(BaseModel):
    id: str
-    type: NodeType = Field(default=NodeType.agentNode)
    position: Position
-    data: NodeDataDTO
+
+
+def _require_prompt(data, type_label: str) -> None:
+    prompt = getattr(data, "prompt", None)
+    if not prompt or len(prompt.strip()) == 0:
+        raise ValueError(f"Prompt is required for {type_label} nodes")
+
+
+class StartCallRFNode(_RFNodeBase):
+    type: Literal["startCall"] = "startCall"
+    data: StartCallNodeData

    @model_validator(mode="after")
-    def _validate_prompt_required(self):
-        """Require prompt for all node types except trigger, webhook, and qa."""
-        if self.type not in (NodeType.trigger, NodeType.webhook, NodeType.qa):
-            if not self.data.prompt or len(self.data.prompt.strip()) == 0:
-                raise ValueError("Prompt is required for non-trigger nodes")
+    def _validate(self):
+        _require_prompt(self.data, "start")
        return self


+class AgentRFNode(_RFNodeBase):
+    type: Literal["agentNode"] = "agentNode"
+    data: AgentNodeData
+
+    @model_validator(mode="after")
+    def _validate(self):
+        _require_prompt(self.data, "agent")
+        return self
+
+
+class EndCallRFNode(_RFNodeBase):
+    type: Literal["endCall"] = "endCall"
+    data: EndCallNodeData
+
+    @model_validator(mode="after")
+    def _validate(self):
+        _require_prompt(self.data, "end")
+        return self
+
+
+class GlobalRFNode(_RFNodeBase):
+    type: Literal["globalNode"] = "globalNode"
+    data: GlobalNodeData
+
+    @model_validator(mode="after")
+    def _validate(self):
+        _require_prompt(self.data, "global")
+        return self
+
+
+class TriggerRFNode(_RFNodeBase):
+    type: Literal["trigger"] = "trigger"
+    data: TriggerNodeData
+
+
+class WebhookRFNode(_RFNodeBase):
+    type: Literal["webhook"] = "webhook"
+    data: WebhookNodeData
+
+
+class QARFNode(_RFNodeBase):
+    type: Literal["qa"] = "qa"
+    data: QANodeData
+
+
+RFNodeDTO = Annotated[
+    Union[
+        StartCallRFNode,
+        AgentRFNode,
+        EndCallRFNode,
+        GlobalRFNode,
+        TriggerRFNode,
+        WebhookRFNode,
+        QARFNode,
+    ],
+    Field(discriminator="type"),
+]
+
+
+# ─────────────────────────────────────────────────────────────────────────
+# Edges
+# ─────────────────────────────────────────────────────────────────────────
+
+
 class EdgeDataDTO(BaseModel):
    label: str = Field(..., min_length=1)
    condition: str = Field(..., min_length=1)
@ -144,3 +298,60 @@ class ReactFlowDTO(BaseModel):
            )

        return self
+
+
+# Node type → per-type data class. Keeps sanitize_workflow_definition in
+# step with RFNodeDTO's discriminated union.
+_NODE_DATA_CLASSES: dict[str, type[BaseModel]] = {
+    NodeType.startNode.value: StartCallNodeData,
+    NodeType.agentNode.value: AgentNodeData,
+    NodeType.endNode.value: EndCallNodeData,
+    NodeType.globalNode.value: GlobalNodeData,
+    NodeType.trigger.value: TriggerNodeData,
+    NodeType.webhook.value: WebhookNodeData,
+    NodeType.qa.value: QANodeData,
+}
+
+
+def sanitize_workflow_definition(definition: dict | None) -> dict | None:
+    """Strip unknown fields from each node.data and edge.data so UI-only
+    runtime state (`invalid`, `validationMessage`, etc.) doesn't leak into
+    persisted workflow JSON.
+
+    Only `.data` is filtered — top-level keys on nodes/edges/definition
+    (viewport, ReactFlow-computed width/height, etc.) are preserved as-is.
+    This is a stripper, not a validator: it doesn't enforce required fields
+    or run model_validators, so partial drafts save cleanly.
+    """
+    if not definition:
+        return definition
+
+    out = dict(definition)
+    raw_nodes = out.get("nodes")
+    if isinstance(raw_nodes, list):
+        out["nodes"] = [_sanitize_node(n) for n in raw_nodes]
+    raw_edges = out.get("edges")
+    if isinstance(raw_edges, list):
+        out["edges"] = [_sanitize_edge(e) for e in raw_edges]
+    return out
+
+
+def _sanitize_node(node):
+    if not isinstance(node, dict):
+        return node
+    data_cls = _NODE_DATA_CLASSES.get(node.get("type"))
+    raw_data = node.get("data")
+    if not data_cls or not isinstance(raw_data, dict):
+        return node
+    allowed = data_cls.model_fields.keys()
+    return {**node, "data": {k: v for k, v in raw_data.items() if k in allowed}}
+
+
+def _sanitize_edge(edge):
+    if not isinstance(edge, dict):
+        return edge
+    raw_data = edge.get("data")
+    if not isinstance(raw_data, dict):
+        return edge
+    allowed = EdgeDataDTO.model_fields.keys()
+    return {**edge, "data": {k: v for k, v in raw_data.items() if k in allowed}}
--- a/api/services/workflow/layout.py
+++ b/api/services/workflow/layout.py
@ -0,0 +1,105 @@
+"""Position reconciliation for LLM-edited workflows.
+
+`save_workflow` re-parses LLM-authored TypeScript into workflow JSON,
+but the parser deliberately ignores positions (LLMs place nodes
+poorly, and the authoring surface stays tighter without coordinates).
+This module fills them back in by matching the newly-parsed nodes
+against the previously-stored workflow:
+
+    1. Named match:   (type, data.name) — most reliable
+    2. Unnamed match: (type, nth-occurrence-in-order) — best effort
+    3. New nodes:     placed adjacent to their first incoming neighbor
+                      (src.x + 400, src.y + 200), or (0, 0) if orphan
+
+The UI has a proper dagre-based re-layout button
+(`ui/src/app/workflow/[workflowId]/utils/layoutNodes.ts`) users can
+invoke when they want a clean pass. This module only aims to avoid
+all-nodes-at-origin after a save.
+"""
+
+from __future__ import annotations
+
+from typing import Any
+
+_DEFAULT_POSITION: dict[str, float] = {"x": 0.0, "y": 0.0}
+# Horizontal / vertical offset for newly-introduced nodes relative to
+# their first incoming neighbor. Chosen to roughly match the UI layout's
+# node spacing without overlapping the neighbor's card.
+_NEW_NODE_DX: float = 400.0
+_NEW_NODE_DY: float = 200.0
+
+
+def reconcile_positions(
+    new_wf: dict[str, Any],
+    previous_wf: dict[str, Any] | None,
+) -> dict[str, Any]:
+    """Return `new_wf` with positions filled from `previous_wf` where
+    node identity matches, and approximate positions for genuinely new
+    nodes. Mutates and returns the same dict (callers typically want
+    the mutation)."""
+    if not previous_wf:
+        _place_new_nodes(new_wf)
+        return new_wf
+
+    prev_nodes = previous_wf.get("nodes") or []
+    named_positions: dict[tuple[str, str], dict[str, float]] = {}
+    unnamed_positions: dict[str, list[dict[str, float]]] = {}
+
+    for n in prev_nodes:
+        t = n.get("type") or ""
+        name = ((n.get("data") or {}).get("name") or "").strip()
+        pos = n.get("position") or dict(_DEFAULT_POSITION)
+        if name:
+            named_positions[(t, name)] = pos
+        else:
+            unnamed_positions.setdefault(t, []).append(pos)
+
+    unnamed_cursor: dict[str, int] = {}
+
+    for node in new_wf.get("nodes") or []:
+        t = node.get("type") or ""
+        name = ((node.get("data") or {}).get("name") or "").strip()
+
+        pos: dict[str, float] | None = None
+        if name:
+            pos = named_positions.get((t, name))
+        if pos is None:
+            idx = unnamed_cursor.get(t, 0)
+            positions = unnamed_positions.get(t, [])
+            if idx < len(positions):
+                pos = positions[idx]
+                unnamed_cursor[t] = idx + 1
+        if pos is not None:
+            node["position"] = dict(pos)
+
+    _place_new_nodes(new_wf)
+    return new_wf
+
+
+def _place_new_nodes(wf: dict[str, Any]) -> None:
+    """For nodes still at (0, 0) — i.e. unmatched by any previous
+    node — pick a position adjacent to the first incoming neighbor.
+    Runs after named/unnamed matching so only genuinely-new nodes are
+    affected."""
+    nodes = wf.get("nodes") or []
+    if not nodes:
+        return
+    id_to_node = {n["id"]: n for n in nodes}
+    edges = wf.get("edges") or []
+
+    for node in nodes:
+        pos = node.get("position") or {}
+        if pos.get("x") or pos.get("y"):
+            continue  # already has a non-origin position
+        src_id = next(
+            (e["source"] for e in edges if e.get("target") == node["id"]),
+            None,
+        )
+        if src_id and src_id in id_to_node:
+            src_pos = id_to_node[src_id].get("position") or dict(_DEFAULT_POSITION)
+            node["position"] = {
+                "x": float(src_pos.get("x", 0.0)) + _NEW_NODE_DX,
+                "y": float(src_pos.get("y", 0.0)) + _NEW_NODE_DY,
+            }
+        # Leaves truly orphan new nodes at (0, 0). The UI's re-layout
+        # pass will pull them into the graph on next edit.
--- a/api/services/workflow/node_specs/init.py
+++ b/api/services/workflow/node_specs/init.py
@ -0,0 +1,82 @@
+"""Node specification registry.
+
+Adding a new node type:
+1. Create a new module under this package, define a `SPEC: NodeSpec`.
+2. Add it to the imports + REGISTRY below.
+3. The Pydantic discriminated-union variant in dto.py must use the same
+   `name` value as `SPEC.name`.
+"""
+
+from __future__ import annotations
+
+from api.services.workflow.node_specs._base import (
+    SPEC_VERSION,
+    DisplayOptions,
+    GraphConstraints,
+    NodeCategory,
+    NodeExample,
+    NodeSpec,
+    PropertyOption,
+    PropertySpec,
+    PropertyType,
+    evaluate_display_options,
+)
+
+REGISTRY: dict[str, NodeSpec] = {}
+
+
+def register(spec: NodeSpec) -> NodeSpec:
+    """Register a NodeSpec in the global registry. Returns the spec for
+    chaining at module top-level: `SPEC = register(NodeSpec(...))`."""
+    if spec.name in REGISTRY:
+        raise ValueError(
+            f"Duplicate NodeSpec registration for {spec.name!r}. "
+            f"Each node type must have exactly one spec."
+        )
+    REGISTRY[spec.name] = spec
+    return spec
+
+
+def get_spec(name: str) -> NodeSpec | None:
+    return REGISTRY.get(name)
+
+
+def all_specs() -> list[NodeSpec]:
+    """All registered specs, sorted by name for stable output."""
+    return [REGISTRY[name] for name in sorted(REGISTRY)]
+
+
+__all__ = [
+    "SPEC_VERSION",
+    "REGISTRY",
+    "DisplayOptions",
+    "GraphConstraints",
+    "NodeCategory",
+    "NodeExample",
+    "NodeSpec",
+    "PropertyOption",
+    "PropertySpec",
+    "PropertyType",
+    "all_specs",
+    "evaluate_display_options",
+    "get_spec",
+    "register",
+]
+
+
+# Side-effect imports — each module's `register(SPEC)` call populates REGISTRY.
+# Keep at module bottom so the registry helpers are defined first.
+from api.services.workflow.node_specs import (  # noqa: E402, F401
+    agent,
+    end_call,
+    global_node,
+    qa,
+    start_call,
+    trigger,
+    webhook,
+)
+
+# Wire up registrations from the SPEC constants in each module.
+for _module in (start_call, agent, end_call, global_node, trigger, webhook, qa):
+    register(_module.SPEC)
+del _module
--- a/api/services/workflow/node_specs/main.py
+++ b/api/services/workflow/node_specs/main.py
@ -0,0 +1,28 @@
+"""Dump the registered NodeSpecs to stdout as JSON.
+
+Used by `scripts/generate_sdk.sh` to feed both SDK codegens without
+requiring a running backend. Shape matches the `/api/v1/node-types`
+HTTP response so either source is interchangeable.
+
+    python -m api.services.workflow.node_specs > specs.json
+"""
+
+from __future__ import annotations
+
+import json
+import sys
+
+from api.services.workflow.node_specs import SPEC_VERSION, all_specs
+
+
+def main() -> None:
+    payload = {
+        "spec_version": SPEC_VERSION,
+        "node_types": [s.model_dump(mode="json") for s in all_specs()],
+    }
+    json.dump(payload, sys.stdout, indent=2, ensure_ascii=False)
+    sys.stdout.write("\n")
+
+
+if __name__ == "__main__":
+    main()
--- a/api/services/workflow/node_specs/_base.py
+++ b/api/services/workflow/node_specs/_base.py
@ -0,0 +1,224 @@
+"""Spec schema for node definitions.
+
+A `NodeSpec` is the single source of truth for a node type. It drives:
+- Pydantic validation (the per-type DTOs in dto.py mirror these property types)
+- The generic UI renderer (frontend reads specs via /api/v1/node-types)
+- The LLM SDK (constructors and JSON-Schema derived from these specs)
+
+Every property's `description` is LLM-readable copy — treat it as production
+documentation, not internal notes. Spec lint enforces non-empty descriptions
+and example coverage.
+"""
+
+from __future__ import annotations
+
+from enum import Enum
+from typing import Any, Optional
+
+from pydantic import BaseModel, ConfigDict, Field
+
+# Spec contract version. Bump when adding new PropertyType values or making
+# breaking changes to the NodeSpec wire shape. SDK clients warn on mismatch.
+SPEC_VERSION = "1.0.0"
+
+
+class PropertyType(str, Enum):
+    """Bounded vocabulary of property types the renderer dispatches on.
+
+    Adding a value here requires a matching arm in the frontend
+    `<PropertyInput>` switch and (where relevant) the SDK codegen template.
+    """
+
+    string = "string"
+    number = "number"
+    boolean = "boolean"
+    options = "options"  # single-select dropdown
+    multi_options = "multi_options"  # multi-select
+    fixed_collection = "fixed_collection"  # repeating rows of sub-properties
+    json = "json"  # arbitrary JSON object editor
+
+    # Domain-specific reference types — values are UUIDs/keys looked up against
+    # a reference catalog (list_tools, list_documents, list_recordings,
+    # list_credentials).
+    tool_refs = "tool_refs"
+    document_refs = "document_refs"
+    recording_ref = "recording_ref"
+    credential_ref = "credential_ref"
+
+    # Domain-specific input widgets
+    mention_textarea = "mention_textarea"  # textarea with {{var}} mentions
+    url = "url"
+
+
+class NodeCategory(str, Enum):
+    """Drives grouping in the AddNodePanel UI."""
+
+    call_node = "call_node"
+    global_node = "global_node"
+    trigger = "trigger"
+    integration = "integration"
+
+
+class DisplayOptions(BaseModel):
+    """Conditional visibility rules.
+
+    `show` keys are AND-combined: this property is visible only when EVERY
+    referenced field's value matches one of the listed values.
+
+    `hide` keys are OR-combined: this property is hidden when ANY referenced
+    field's value matches one of the listed values.
+
+    Example:
+        DisplayOptions(show={"extraction_enabled": [True]})
+        DisplayOptions(show={"greeting_type": ["audio"]})
+    """
+
+    show: Optional[dict[str, list[Any]]] = None
+    hide: Optional[dict[str, list[Any]]] = None
+
+    model_config = ConfigDict(extra="forbid")
+
+
+def evaluate_display_options(
+    rules: Optional[DisplayOptions | dict[str, Any]],
+    values: dict[str, Any],
+) -> bool:
+    """Reference implementation of the display_options visibility check.
+
+    Mirrored 1:1 in the TypeScript renderer
+    (`ui/src/components/flow/renderer/displayOptions.ts`). The golden
+    fixtures in `display_options_fixtures.json` lock the two
+    implementations together — update both whenever the semantics change.
+    """
+    if rules is None:
+        return True
+
+    if isinstance(rules, DisplayOptions):
+        show = rules.show
+        hide = rules.hide
+    else:
+        show = rules.get("show")
+        hide = rules.get("hide")
+
+    if show:
+        for field, allowed in show.items():
+            if values.get(field) not in allowed:
+                return False
+
+    if hide:
+        for field, hidden in hide.items():
+            if values.get(field) in hidden:
+                return False
+
+    return True
+
+
+class PropertyOption(BaseModel):
+    """An option in an `options` or `multi_options` dropdown."""
+
+    value: str | int | bool | float
+    label: str
+    description: Optional[str] = None
+
+    model_config = ConfigDict(extra="forbid")
+
+
+class PropertySpec(BaseModel):
+    """Single field on a node.
+
+    `description` is HUMAN-FACING — shown under the field in the edit
+    dialog. Keep it concise and explain what the field does.
+
+    `llm_hint` is LLM-FACING — appears only in the `get_node_type` MCP
+    response and in SDK schema output. Use it for catalog tool references
+    (e.g., "Use `list_recordings`"), array shape, expected value idioms,
+    or anything that would be noise in the UI. Optional; omit when the
+    `description` already suffices for both audiences.
+    """
+
+    name: str
+    type: PropertyType
+    display_name: str
+    description: str = Field(
+        ...,
+        min_length=1,
+        description="Human-facing explanation shown in the UI.",
+    )
+    llm_hint: Optional[str] = Field(
+        default=None,
+        description="LLM-only guidance; omitted from the UI.",
+    )
+    default: Any = None
+    required: bool = False
+    placeholder: Optional[str] = None
+
+    display_options: Optional[DisplayOptions] = None
+
+    # For `options` / `multi_options`
+    options: Optional[list[PropertyOption]] = None
+
+    # For `fixed_collection` — sub-properties of each row
+    properties: Optional[list["PropertySpec"]] = None
+
+    # Validation hints. Enforced by Pydantic where possible.
+    min_value: Optional[float] = None
+    max_value: Optional[float] = None
+    min_length: Optional[int] = None
+    max_length: Optional[int] = None
+    pattern: Optional[str] = None
+
+    # Renderer hint, e.g. "textarea" vs single-line for `string`.
+    editor: Optional[str] = None
+
+    # Free-form metadata for renderer-specific behavior. Use sparingly.
+    extra: dict[str, Any] = Field(default_factory=dict)
+
+    model_config = ConfigDict(extra="forbid")
+
+
+PropertySpec.model_rebuild()
+
+
+class NodeExample(BaseModel):
+    """A worked example LLMs can pattern-match. Keep small and realistic."""
+
+    name: str
+    description: Optional[str] = None
+    data: dict[str, Any]
+
+    model_config = ConfigDict(extra="forbid")
+
+
+class GraphConstraints(BaseModel):
+    """Per-node-type graph rules. WorkflowGraph enforces these at validation."""
+
+    min_incoming: Optional[int] = None
+    max_incoming: Optional[int] = None
+    min_outgoing: Optional[int] = None
+    max_outgoing: Optional[int] = None
+
+    model_config = ConfigDict(extra="forbid")
+
+
+class NodeSpec(BaseModel):
+    """Single source of truth for a node type."""
+
+    name: str  # machine name; matches the Pydantic discriminator value
+    display_name: str
+    description: str = Field(
+        ...,
+        min_length=1,
+        description="Human-facing explanation shown in AddNodePanel.",
+    )
+    llm_hint: Optional[str] = Field(
+        default=None,
+        description="LLM-only guidance; omitted from the UI.",
+    )
+    category: NodeCategory
+    icon: str  # lucide-react icon name (e.g., "Play")
+    version: str = "1.0.0"
+    properties: list[PropertySpec]
+    examples: list[NodeExample] = Field(default_factory=list)
+    graph_constraints: Optional[GraphConstraints] = None
+
+    model_config = ConfigDict(extra="forbid")
--- a/api/services/workflow/node_specs/agent.py
+++ b/api/services/workflow/node_specs/agent.py
@ -0,0 +1,168 @@
+"""Spec for the Agent node — the workhorse mid-call node where the LLM
+executes a focused conversational step with optional tools and documents."""
+
+from api.services.workflow.node_specs._base import (
+    DisplayOptions,
+    GraphConstraints,
+    NodeCategory,
+    NodeExample,
+    NodeSpec,
+    PropertyOption,
+    PropertySpec,
+    PropertyType,
+)
+
+SPEC = NodeSpec(
+    name="agentNode",
+    display_name="Agent Node",
+    description="Conversational step — the LLM runs one focused exchange.",
+    llm_hint=(
+        "Mid-call step executed by the LLM. Most workflows are a chain of "
+        "agent nodes connected by edges that describe transition conditions. "
+        "Each agent node can invoke tools and reference documents."
+    ),
+    category=NodeCategory.call_node,
+    icon="Headset",
+    properties=[
+        PropertySpec(
+            name="name",
+            type=PropertyType.string,
+            display_name="Name",
+            description=(
+                "Short identifier for this step (e.g., 'Qualify Budget'). "
+                "Appears in call logs and edge transition tools."
+            ),
+            required=True,
+            min_length=1,
+            default="Agent",
+        ),
+        PropertySpec(
+            name="prompt",
+            type=PropertyType.mention_textarea,
+            display_name="Prompt",
+            description=(
+                "Agent system prompt for this step. Supports "
+                "{{template_variables}} from extraction or pre-call fetch."
+            ),
+            required=True,
+            min_length=1,
+            placeholder="Ask the caller about their budget and timeline.",
+        ),
+        PropertySpec(
+            name="allow_interrupt",
+            type=PropertyType.boolean,
+            display_name="Allow Interruption",
+            description=(
+                "When true, the user can interrupt the agent mid-utterance. "
+                "Set false for non-interruptible disclosures."
+            ),
+            default=True,
+        ),
+        PropertySpec(
+            name="add_global_prompt",
+            type=PropertyType.boolean,
+            display_name="Add Global Prompt",
+            description=(
+                "When true and a Global node exists, prepends the global "
+                "prompt to this node's prompt at runtime."
+            ),
+            default=True,
+        ),
+        PropertySpec(
+            name="extraction_enabled",
+            type=PropertyType.boolean,
+            display_name="Enable Variable Extraction",
+            description=(
+                "When true, runs an LLM extraction pass on transition out of "
+                "this node to capture variables from the conversation."
+            ),
+            default=False,
+        ),
+        PropertySpec(
+            name="extraction_prompt",
+            type=PropertyType.string,
+            display_name="Extraction Prompt",
+            description="Overall instructions guiding variable extraction.",
+            display_options=DisplayOptions(show={"extraction_enabled": [True]}),
+            editor="textarea",
+        ),
+        PropertySpec(
+            name="extraction_variables",
+            type=PropertyType.fixed_collection,
+            display_name="Variables to Extract",
+            description=(
+                "Each entry declares one variable to capture from the "
+                "conversation, with its name, type, and per-variable hint."
+            ),
+            display_options=DisplayOptions(show={"extraction_enabled": [True]}),
+            properties=[
+                PropertySpec(
+                    name="name",
+                    type=PropertyType.string,
+                    display_name="Variable Name",
+                    description="snake_case identifier used downstream.",
+                    required=True,
+                ),
+                PropertySpec(
+                    name="type",
+                    type=PropertyType.options,
+                    display_name="Type",
+                    description="Data type of the extracted value.",
+                    required=True,
+                    default="string",
+                    options=[
+                        PropertyOption(value="string", label="String"),
+                        PropertyOption(value="number", label="Number"),
+                        PropertyOption(value="boolean", label="Boolean"),
+                    ],
+                ),
+                PropertySpec(
+                    name="prompt",
+                    type=PropertyType.string,
+                    display_name="Extraction Hint",
+                    description="Per-variable hint describing what to look for.",
+                    editor="textarea",
+                ),
+            ],
+        ),
+        PropertySpec(
+            name="tool_uuids",
+            type=PropertyType.tool_refs,
+            display_name="Tools",
+            description="Tools the agent can invoke during this step.",
+            llm_hint="List of tool UUIDs from `list_tools`.",
+        ),
+        PropertySpec(
+            name="document_uuids",
+            type=PropertyType.document_refs,
+            display_name="Knowledge Base Documents",
+            description="Documents the agent can reference during this step.",
+            llm_hint="List of document UUIDs from `list_documents`.",
+        ),
+    ],
+    examples=[
+        NodeExample(
+            name="qualify_lead",
+            data={
+                "name": "Qualify Budget",
+                "prompt": "Ask about budget and timeline. Capture both before transitioning.",
+                "allow_interrupt": True,
+                "extraction_enabled": True,
+                "extraction_prompt": "Extract budget amount and rough timeline.",
+                "extraction_variables": [
+                    {
+                        "name": "budget_usd",
+                        "type": "number",
+                        "prompt": "Stated budget in USD",
+                    },
+                    {
+                        "name": "timeline",
+                        "type": "string",
+                        "prompt": "When they want to start",
+                    },
+                ],
+            },
+        ),
+    ],
+    graph_constraints=GraphConstraints(min_incoming=1),
+)
--- a/api/services/workflow/node_specs/display_options_fixtures.json
+++ b/api/services/workflow/node_specs/display_options_fixtures.json
@ -0,0 +1,123 @@
+{
+  "_doc": "Golden fixtures for the display_options evaluator. Both the Python evaluator (api/services/workflow/node_specs/_base.py:evaluate_display_options) and the TypeScript evaluator (ui/src/components/flow/renderer/displayOptions.ts:evaluateDisplayOptions) must agree on every case here. Fixtures double as documentation for the show/hide semantics.",
+  "cases": [
+    {
+      "name": "no_rules_visible",
+      "rules": null,
+      "values": {"a": 1},
+      "expected": true
+    },
+    {
+      "name": "empty_rules_visible",
+      "rules": {"show": null, "hide": null},
+      "values": {},
+      "expected": true
+    },
+    {
+      "name": "show_match_visible",
+      "rules": {"show": {"extraction_enabled": [true]}},
+      "values": {"extraction_enabled": true},
+      "expected": true
+    },
+    {
+      "name": "show_mismatch_hidden",
+      "rules": {"show": {"extraction_enabled": [true]}},
+      "values": {"extraction_enabled": false},
+      "expected": false
+    },
+    {
+      "name": "show_missing_field_hidden",
+      "rules": {"show": {"extraction_enabled": [true]}},
+      "values": {},
+      "expected": false
+    },
+    {
+      "name": "show_multiple_allowed_values",
+      "rules": {"show": {"greeting_type": ["text", "audio"]}},
+      "values": {"greeting_type": "audio"},
+      "expected": true
+    },
+    {
+      "name": "show_multiple_keys_all_match",
+      "rules": {
+        "show": {
+          "qa_use_workflow_llm": [false],
+          "qa_provider": ["azure"]
+        }
+      },
+      "values": {"qa_use_workflow_llm": false, "qa_provider": "azure"},
+      "expected": true
+    },
+    {
+      "name": "show_multiple_keys_one_mismatch_hides",
+      "rules": {
+        "show": {
+          "qa_use_workflow_llm": [false],
+          "qa_provider": ["azure"]
+        }
+      },
+      "values": {"qa_use_workflow_llm": false, "qa_provider": "openai"},
+      "expected": false
+    },
+    {
+      "name": "hide_match_hides",
+      "rules": {"hide": {"locked": [true]}},
+      "values": {"locked": true},
+      "expected": false
+    },
+    {
+      "name": "hide_mismatch_visible",
+      "rules": {"hide": {"locked": [true]}},
+      "values": {"locked": false},
+      "expected": true
+    },
+    {
+      "name": "hide_missing_field_visible",
+      "rules": {"hide": {"locked": [true]}},
+      "values": {},
+      "expected": true
+    },
+    {
+      "name": "hide_or_combined_either_hides",
+      "rules": {"hide": {"a": [1], "b": [2]}},
+      "values": {"a": 0, "b": 2},
+      "expected": false
+    },
+    {
+      "name": "show_and_hide_both_required",
+      "rules": {"show": {"enabled": [true]}, "hide": {"locked": [true]}},
+      "values": {"enabled": true, "locked": false},
+      "expected": true
+    },
+    {
+      "name": "show_and_hide_show_passes_hide_blocks",
+      "rules": {"show": {"enabled": [true]}, "hide": {"locked": [true]}},
+      "values": {"enabled": true, "locked": true},
+      "expected": false
+    },
+    {
+      "name": "show_and_hide_show_fails_hide_irrelevant",
+      "rules": {"show": {"enabled": [true]}, "hide": {"locked": [true]}},
+      "values": {"enabled": false, "locked": false},
+      "expected": false
+    },
+    {
+      "name": "scalar_int_strict",
+      "rules": {"show": {"sample_rate": [100]}},
+      "values": {"sample_rate": 100},
+      "expected": true
+    },
+    {
+      "name": "scalar_int_mismatch",
+      "rules": {"show": {"sample_rate": [100]}},
+      "values": {"sample_rate": 99},
+      "expected": false
+    },
+    {
+      "name": "scalar_string_strict",
+      "rules": {"show": {"http_method": ["POST", "PUT"]}},
+      "values": {"http_method": "GET"},
+      "expected": false
+    }
+  ]
+}
--- a/api/services/workflow/node_specs/end_call.py
+++ b/api/services/workflow/node_specs/end_call.py
@ -0,0 +1,141 @@
+"""Spec for the End Call node — terminal node that wraps up a conversation
+and optionally extracts variables before hangup."""
+
+from api.services.workflow.node_specs._base import (
+    DisplayOptions,
+    GraphConstraints,
+    NodeCategory,
+    NodeExample,
+    NodeSpec,
+    PropertyOption,
+    PropertySpec,
+    PropertyType,
+)
+
+SPEC = NodeSpec(
+    name="endCall",
+    display_name="End Call",
+    description="Closes the conversation and hangs up.",
+    llm_hint=(
+        "Terminal node that politely closes the conversation. Variable "
+        "extraction can run before hangup. A workflow can have multiple "
+        "endCall nodes reached via different edge conditions."
+    ),
+    category=NodeCategory.call_node,
+    icon="OctagonX",
+    properties=[
+        PropertySpec(
+            name="name",
+            type=PropertyType.string,
+            display_name="Name",
+            description=(
+                "Short identifier shown in call logs. Should describe the "
+                "ending context (e.g., 'Successful close', 'Polite decline')."
+            ),
+            required=True,
+            min_length=1,
+            default="End Call",
+        ),
+        PropertySpec(
+            name="prompt",
+            type=PropertyType.mention_textarea,
+            display_name="Prompt",
+            description=(
+                "Agent system prompt for the closing exchange. Supports "
+                "{{template_variables}} from extraction or pre-call fetch."
+            ),
+            required=True,
+            min_length=1,
+            placeholder="Thank the caller and confirm next steps before ending the call.",
+        ),
+        PropertySpec(
+            name="add_global_prompt",
+            type=PropertyType.boolean,
+            display_name="Add Global Prompt",
+            description=(
+                "When true and a Global node exists, prepends the global "
+                "prompt to this node's prompt at runtime."
+            ),
+            default=False,
+        ),
+        PropertySpec(
+            name="extraction_enabled",
+            type=PropertyType.boolean,
+            display_name="Enable Variable Extraction",
+            description=(
+                "When true, runs an LLM extraction pass before hangup to "
+                "capture variables from the conversation."
+            ),
+            default=False,
+        ),
+        PropertySpec(
+            name="extraction_prompt",
+            type=PropertyType.string,
+            display_name="Extraction Prompt",
+            description=(
+                "Overall instructions guiding how variables should be "
+                "extracted from the conversation."
+            ),
+            display_options=DisplayOptions(show={"extraction_enabled": [True]}),
+            editor="textarea",
+        ),
+        PropertySpec(
+            name="extraction_variables",
+            type=PropertyType.fixed_collection,
+            display_name="Variables to Extract",
+            description=(
+                "Each entry declares one variable to capture from the "
+                "conversation, with its name, data type, and a per-variable "
+                "extraction hint."
+            ),
+            display_options=DisplayOptions(show={"extraction_enabled": [True]}),
+            properties=[
+                PropertySpec(
+                    name="name",
+                    type=PropertyType.string,
+                    display_name="Variable Name",
+                    description="snake_case identifier used downstream.",
+                    required=True,
+                ),
+                PropertySpec(
+                    name="type",
+                    type=PropertyType.options,
+                    display_name="Type",
+                    description="The data type of the extracted value.",
+                    required=True,
+                    default="string",
+                    options=[
+                        PropertyOption(value="string", label="String"),
+                        PropertyOption(value="number", label="Number"),
+                        PropertyOption(value="boolean", label="Boolean"),
+                    ],
+                ),
+                PropertySpec(
+                    name="prompt",
+                    type=PropertyType.string,
+                    display_name="Extraction Hint",
+                    description=(
+                        "Per-variable hint describing what to look for in "
+                        "the conversation."
+                    ),
+                    editor="textarea",
+                ),
+            ],
+        ),
+    ],
+    examples=[
+        NodeExample(
+            name="successful_close",
+            data={
+                "name": "Successful Close",
+                "prompt": "Confirm the appointment time, thank the caller, and end the call.",
+                "add_global_prompt": False,
+            },
+        ),
+    ],
+    graph_constraints=GraphConstraints(
+        min_incoming=1,
+        min_outgoing=0,
+        max_outgoing=0,
+    ),
+)
--- a/api/services/workflow/node_specs/global_node.py
+++ b/api/services/workflow/node_specs/global_node.py
@ -0,0 +1,77 @@
+"""Spec for the Global node — system-level instructions appended to every
+agent node that opts in via `add_global_prompt`."""
+
+from api.services.workflow.node_specs._base import (
+    GraphConstraints,
+    NodeCategory,
+    NodeExample,
+    NodeSpec,
+    PropertySpec,
+    PropertyType,
+)
+
+SPEC = NodeSpec(
+    name="globalNode",
+    display_name="Global Node",
+    description="Persona/tone appended to every agent node's prompt.",
+    llm_hint=(
+        "System-level prompt appended to every prompted node whose "
+        "`add_global_prompt` is true. Use it for persona, tone, and shared "
+        "rules that apply across the entire conversation. At most one "
+        "global node per workflow."
+    ),
+    category=NodeCategory.global_node,
+    icon="Globe",
+    properties=[
+        PropertySpec(
+            name="name",
+            type=PropertyType.string,
+            display_name="Name",
+            description=(
+                "Short identifier shown in the canvas and call logs. Has no "
+                "runtime effect."
+            ),
+            required=True,
+            min_length=1,
+            default="Global Node",
+        ),
+        PropertySpec(
+            name="prompt",
+            type=PropertyType.mention_textarea,
+            display_name="Global Prompt",
+            description=(
+                "Text appended to every prompted node's system prompt when "
+                "that node has `add_global_prompt=true`. Supports "
+                "{{template_variables}}."
+            ),
+            required=True,
+            min_length=1,
+            placeholder="You are a friendly assistant calling on behalf of {{company_name}}.",
+            default=(
+                "You are a helpful assistant whose mode of interaction with "
+                "the user is voice. So don't use any special characters which "
+                "can not be pronounced. Use short sentences and simple language."
+            ),
+        ),
+    ],
+    examples=[
+        NodeExample(
+            name="basic_persona",
+            description="Establishes a consistent persona across the call.",
+            data={
+                "name": "Persona",
+                "prompt": (
+                    "You are Sarah, a polite and warm representative from "
+                    "Acme Corp. Always thank the caller for their time and "
+                    "speak in short conversational sentences."
+                ),
+            },
+        ),
+    ],
+    graph_constraints=GraphConstraints(
+        min_incoming=0,
+        max_incoming=0,
+        min_outgoing=0,
+        max_outgoing=0,
+    ),
+)
--- a/api/services/workflow/node_specs/qa.py
+++ b/api/services/workflow/node_specs/qa.py
@ -0,0 +1,196 @@
+"""Spec for the QA Analysis node — runs an LLM quality review on the call
+transcript after completion."""
+
+from api.services.workflow.node_specs._base import (
+    DisplayOptions,
+    NodeCategory,
+    NodeExample,
+    NodeSpec,
+    PropertyOption,
+    PropertySpec,
+    PropertyType,
+)
+
+DEFAULT_QA_SYSTEM_PROMPT = """You are a QA analyst evaluating a specific segment of a voice AI conversation.
+
+## Node Purpose
+{{node_summary}}
+
+## Previous Conversation Context (For start of conversation, previous conversation summary can be empty.)
+{{previous_conversation_summary}}
+
+## Tags to evaluate
+
+Examine the conversation carefully and identify which of the following tags apply:
+
+- UNCLEAR_CONVERSATION - The conversation is not coherent or clear, messages don't connect logically
+- ASSISTANT_IN_LOOP - The assistant asks the same question multiple times or gets stuck repeating itself
+- ASSISTANT_REPLY_IMPROPER - The assistant did not reply properly to the user's question/query or seems confused by what the user said
+- USER_FRUSTRATED - The user seems angry, frustrated, or is complaining about something in the call
+- USER_NOT_UNDERSTANDING - The user explicitly says they don't understand or repeatedly asks for clarification
+- HEARING_ISSUES - Either party can't hear the other ("hello?", "are you there?", "can you hear me?")
+- DEAD_AIR - Unusually long silences in the conversation (use the timestamps to judge)
+- USER_REQUESTING_FEATURE - The user asks for something the assistant can't fulfill
+- ASSISTANT_LACKS_EMPATHY - The assistant ignores the user's personal situation or emotional state and continues pitching or pushing the agenda.
+- USER_DETECTS_AI - The user suspects or identifies that they are talking to an AI/robot/bot rather than a real human.
+
+## Call metrics (pre-computed)
+
+Use these alongside the transcript for your analysis:
+{{metrics}}
+
+## Output format
+
+Return ONLY a valid JSON object (no markdown):
+{
+    "tags": [
+        {
+            "tag": "TAG_NAME",
+            "reason": "Short reason with evidence from the transcript"
+        }
+    ],
+    "overall_sentiment": "positive|neutral|negative",
+    "call_quality_score": <1-10>,
+    "summary": "1-2 sentence summary of this segment"
+}
+
+If no tags apply, return an empty tags list. Always provide sentiment, score, and summary."""
+
+
+SPEC = NodeSpec(
+    name="qa",
+    display_name="QA Analysis",
+    description="Run LLM quality analysis on the call transcript.",
+    llm_hint=(
+        "Runs an LLM quality review on the call transcript after completion. "
+        "Per-node analysis splits the conversation by node and evaluates each "
+        "segment against the configured system prompt. Sampling, minimum "
+        "duration, and voicemail filters are supported."
+    ),
+    category=NodeCategory.integration,
+    icon="ClipboardCheck",
+    properties=[
+        PropertySpec(
+            name="name",
+            type=PropertyType.string,
+            display_name="Name",
+            description="Short identifier for this QA configuration.",
+            required=True,
+            min_length=1,
+            default="QA Analysis",
+        ),
+        PropertySpec(
+            name="qa_enabled",
+            type=PropertyType.boolean,
+            display_name="Enabled",
+            description="When false, the QA run is skipped.",
+            default=True,
+        ),
+        PropertySpec(
+            name="qa_system_prompt",
+            type=PropertyType.string,
+            display_name="System Prompt",
+            description=(
+                "Instructions to the QA reviewer LLM. Supports placeholders: "
+                "`{node_summary}`, `{previous_conversation_summary}`, "
+                "`{transcript}`, `{metrics}`."
+            ),
+            editor="textarea",
+            default=DEFAULT_QA_SYSTEM_PROMPT,
+        ),
+        PropertySpec(
+            name="qa_min_call_duration",
+            type=PropertyType.number,
+            display_name="Minimum Call Duration (seconds)",
+            description="Calls shorter than this are skipped.",
+            default=15,
+            min_value=0,
+        ),
+        PropertySpec(
+            name="qa_voicemail_calls",
+            type=PropertyType.boolean,
+            display_name="Include Voicemail Calls",
+            description="When false, calls flagged as voicemail are skipped.",
+            default=False,
+        ),
+        PropertySpec(
+            name="qa_sample_rate",
+            type=PropertyType.number,
+            display_name="Sample Rate (%)",
+            description=(
+                "Percent of eligible calls QA'd. 100 means every call; lower "
+                "values use random sampling."
+            ),
+            default=100,
+            min_value=1,
+            max_value=100,
+        ),
+        # ---- LLM configuration ----
+        PropertySpec(
+            name="qa_use_workflow_llm",
+            type=PropertyType.boolean,
+            display_name="Use Workflow's LLM",
+            description=(
+                "When true, the QA pass uses the same LLM the workflow runs "
+                "with. Set false to specify a separate provider/model."
+            ),
+            default=True,
+        ),
+        PropertySpec(
+            name="qa_provider",
+            type=PropertyType.options,
+            display_name="QA LLM Provider",
+            description="LLM provider used for the QA pass.",
+            display_options=DisplayOptions(show={"qa_use_workflow_llm": [False]}),
+            options=[
+                PropertyOption(value="openai", label="OpenAI"),
+                PropertyOption(value="azure", label="Azure OpenAI"),
+                PropertyOption(value="openrouter", label="OpenRouter"),
+                PropertyOption(value="anthropic", label="Anthropic"),
+            ],
+        ),
+        PropertySpec(
+            name="qa_model",
+            type=PropertyType.string,
+            display_name="QA Model",
+            description=(
+                "Model identifier (e.g., 'gpt-4o', 'claude-sonnet-4-6'). "
+                "Provider-specific."
+            ),
+            display_options=DisplayOptions(show={"qa_use_workflow_llm": [False]}),
+            default="default",
+        ),
+        PropertySpec(
+            name="qa_api_key",
+            type=PropertyType.string,
+            display_name="API Key",
+            description="API key for the chosen provider.",
+            display_options=DisplayOptions(show={"qa_use_workflow_llm": [False]}),
+        ),
+        PropertySpec(
+            name="qa_endpoint",
+            type=PropertyType.url,
+            display_name="Azure Endpoint",
+            description="Required for the Azure provider.",
+            display_options=DisplayOptions(
+                show={"qa_use_workflow_llm": [False], "qa_provider": ["azure"]}
+            ),
+        ),
+    ],
+    examples=[
+        NodeExample(
+            name="basic_qa",
+            data={
+                "name": "Compliance Check",
+                "qa_enabled": True,
+                "qa_system_prompt": (
+                    "You are a compliance reviewer. Review the transcript and "
+                    "produce a JSON object with `tags`, `summary`, "
+                    "`call_quality_score`, and `overall_sentiment`."
+                ),
+                "qa_min_call_duration": 30,
+                "qa_sample_rate": 100,
+            },
+        ),
+    ],
+)
--- a/api/services/workflow/node_specs/start_call.py
+++ b/api/services/workflow/node_specs/start_call.py
@ -0,0 +1,248 @@
+"""Spec for the Start Call node — the single entry point of every workflow.
+Carries greeting, pre-call data fetch, and the same prompt/extraction/tools
+fields as agent nodes."""
+
+from api.services.workflow.node_specs._base import (
+    DisplayOptions,
+    GraphConstraints,
+    NodeCategory,
+    NodeExample,
+    NodeSpec,
+    PropertyOption,
+    PropertySpec,
+    PropertyType,
+)
+
+SPEC = NodeSpec(
+    name="startCall",
+    display_name="Start Call",
+    description="Entry point of the workflow — plays a greeting and opens the conversation.",
+    llm_hint=(
+        "The entry point of every workflow (exactly one required). Plays an "
+        "optional greeting, can fetch context from an external API before "
+        "the call begins, and executes the first conversational turn."
+    ),
+    category=NodeCategory.call_node,
+    icon="Play",
+    properties=[
+        PropertySpec(
+            name="name",
+            type=PropertyType.string,
+            display_name="Name",
+            description="Short identifier shown in the canvas and call logs.",
+            required=True,
+            min_length=1,
+            default="Start Call",
+        ),
+        # ---- Greeting (variant via greeting_type) ----
+        PropertySpec(
+            name="greeting_type",
+            type=PropertyType.options,
+            display_name="Greeting Type",
+            description=(
+                "Whether the optional greeting is spoken via TTS from text "
+                "or played from a pre-recorded audio file."
+            ),
+            default="text",
+            options=[
+                PropertyOption(value="text", label="Text (TTS)"),
+                PropertyOption(value="audio", label="Pre-recorded Audio"),
+            ],
+        ),
+        PropertySpec(
+            name="greeting",
+            type=PropertyType.string,
+            display_name="Greeting Text",
+            description=(
+                "Text spoken via TTS at the start of the call. Supports "
+                "{{template_variables}}. Leave empty to skip the greeting."
+            ),
+            display_options=DisplayOptions(show={"greeting_type": ["text"]}),
+            editor="textarea",
+            placeholder="Hi {{first_name}}, this is Sarah from Acme.",
+        ),
+        PropertySpec(
+            name="greeting_recording_id",
+            type=PropertyType.recording_ref,
+            display_name="Greeting Recording",
+            description="Pre-recorded audio file played at the start of the call.",
+            llm_hint=(
+                "Value is the `recording_id` string. Use the `list_recordings` "
+                "MCP tool to discover available recordings."
+            ),
+            display_options=DisplayOptions(show={"greeting_type": ["audio"]}),
+        ),
+        PropertySpec(
+            name="prompt",
+            type=PropertyType.mention_textarea,
+            display_name="Prompt",
+            description=(
+                "Agent system prompt for the opening turn. Supports "
+                "{{template_variables}} from pre-call fetch and the initial context."
+            ),
+            required=True,
+            min_length=1,
+            placeholder="Greet the caller warmly and ask how you can help today.",
+        ),
+        # ---- Behavior toggles ----
+        PropertySpec(
+            name="allow_interrupt",
+            type=PropertyType.boolean,
+            display_name="Allow Interruption",
+            description=("When true, the user can interrupt the agent mid-utterance."),
+            default=False,
+        ),
+        PropertySpec(
+            name="add_global_prompt",
+            type=PropertyType.boolean,
+            display_name="Add Global Prompt",
+            description=(
+                "When true and a Global node exists, prepends the global "
+                "prompt to this node's prompt at runtime."
+            ),
+            default=True,
+        ),
+        PropertySpec(
+            name="delayed_start",
+            type=PropertyType.boolean,
+            display_name="Delayed Start",
+            description=(
+                "When true, the agent waits before speaking after pickup. "
+                "Useful for outbound calls where the called party needs a "
+                "moment to settle."
+            ),
+            default=False,
+        ),
+        PropertySpec(
+            name="delayed_start_duration",
+            type=PropertyType.number,
+            display_name="Delay Duration (seconds)",
+            description="Seconds to wait before the agent speaks. 0.1–10.",
+            default=2.0,
+            min_value=0.1,
+            max_value=10.0,
+            display_options=DisplayOptions(show={"delayed_start": [True]}),
+        ),
+        # ---- Variable extraction ----
+        PropertySpec(
+            name="extraction_enabled",
+            type=PropertyType.boolean,
+            display_name="Enable Variable Extraction",
+            description=(
+                "When true, runs an LLM extraction pass on transition out of "
+                "this node to capture variables from the opening turn."
+            ),
+            default=False,
+        ),
+        PropertySpec(
+            name="extraction_prompt",
+            type=PropertyType.string,
+            display_name="Extraction Prompt",
+            description="Overall instructions guiding variable extraction.",
+            display_options=DisplayOptions(show={"extraction_enabled": [True]}),
+            editor="textarea",
+        ),
+        PropertySpec(
+            name="extraction_variables",
+            type=PropertyType.fixed_collection,
+            display_name="Variables to Extract",
+            description=(
+                "Each entry declares one variable to capture, with its name, "
+                "data type, and per-variable extraction hint."
+            ),
+            display_options=DisplayOptions(show={"extraction_enabled": [True]}),
+            properties=[
+                PropertySpec(
+                    name="name",
+                    type=PropertyType.string,
+                    display_name="Variable Name",
+                    description="snake_case identifier used downstream.",
+                    required=True,
+                ),
+                PropertySpec(
+                    name="type",
+                    type=PropertyType.options,
+                    display_name="Type",
+                    description="Data type of the extracted value.",
+                    required=True,
+                    default="string",
+                    options=[
+                        PropertyOption(value="string", label="String"),
+                        PropertyOption(value="number", label="Number"),
+                        PropertyOption(value="boolean", label="Boolean"),
+                    ],
+                ),
+                PropertySpec(
+                    name="prompt",
+                    type=PropertyType.string,
+                    display_name="Extraction Hint",
+                    description="Per-variable hint describing what to look for.",
+                    editor="textarea",
+                ),
+            ],
+        ),
+        # ---- Tools / documents ----
+        PropertySpec(
+            name="tool_uuids",
+            type=PropertyType.tool_refs,
+            display_name="Tools",
+            description="Tools the agent can invoke during the opening turn.",
+            llm_hint="List of tool UUIDs from `list_tools`.",
+        ),
+        PropertySpec(
+            name="document_uuids",
+            type=PropertyType.document_refs,
+            display_name="Knowledge Base Documents",
+            description="Documents the agent can reference.",
+            llm_hint="List of document UUIDs from `list_documents`.",
+        ),
+        # ---- Pre-call data fetch (advanced) ----
+        PropertySpec(
+            name="pre_call_fetch_enabled",
+            type=PropertyType.boolean,
+            display_name="Pre-Call Data Fetch",
+            description=(
+                "When true, makes a POST request to an external API before "
+                "the call starts and merges the JSON response into the call "
+                "context as template variables."
+            ),
+            default=False,
+        ),
+        PropertySpec(
+            name="pre_call_fetch_url",
+            type=PropertyType.url,
+            display_name="Endpoint URL",
+            description=(
+                "URL the pre-call POST request is sent to. The request body "
+                "includes caller and called numbers."
+            ),
+            display_options=DisplayOptions(show={"pre_call_fetch_enabled": [True]}),
+            placeholder="https://api.example.com/customer-lookup",
+        ),
+        PropertySpec(
+            name="pre_call_fetch_credential_uuid",
+            type=PropertyType.credential_ref,
+            display_name="Authentication",
+            description="Optional credential attached to the pre-call request.",
+            llm_hint="Credential UUID from `list_credentials`.",
+            display_options=DisplayOptions(show={"pre_call_fetch_enabled": [True]}),
+        ),
+    ],
+    examples=[
+        NodeExample(
+            name="warm_greeting",
+            data={
+                "name": "Greeting",
+                "prompt": "Greet warmly and ask the caller's reason for calling.",
+                "greeting_type": "text",
+                "greeting": "Hi {{first_name}}, this is Sarah from Acme.",
+                "allow_interrupt": True,
+            },
+        ),
+    ],
+    graph_constraints=GraphConstraints(
+        min_incoming=0,
+        max_incoming=0,
+        min_outgoing=1,
+    ),
+)
--- a/api/services/workflow/node_specs/trigger.py
+++ b/api/services/workflow/node_specs/trigger.py
@ -0,0 +1,61 @@
+"""Spec for the API Trigger node — exposes a public webhook URL that
+external systems can hit to launch the workflow."""
+
+from api.services.workflow.node_specs._base import (
+    GraphConstraints,
+    NodeCategory,
+    NodeExample,
+    NodeSpec,
+    PropertySpec,
+    PropertyType,
+)
+
+SPEC = NodeSpec(
+    name="trigger",
+    display_name="API Trigger",
+    description="Public HTTP endpoint that launches the workflow.",
+    llm_hint=(
+        "Exposes a public HTTP POST endpoint. External systems call the URL "
+        "(derived from the auto-generated `trigger_path`) to launch this "
+        "workflow. Requires an API key in the `X-API-Key` header."
+    ),
+    category=NodeCategory.trigger,
+    icon="Webhook",
+    properties=[
+        PropertySpec(
+            name="name",
+            type=PropertyType.string,
+            display_name="Name",
+            description="Short identifier shown in the canvas. No runtime effect.",
+            required=True,
+            min_length=1,
+            default="API Trigger",
+        ),
+        PropertySpec(
+            name="enabled",
+            type=PropertyType.boolean,
+            display_name="Enabled",
+            description="When false, the trigger URL returns 404.",
+            default=True,
+        ),
+        PropertySpec(
+            name="trigger_path",
+            type=PropertyType.string,
+            display_name="Trigger Path",
+            description=(
+                "Auto-generated UUID-style path segment that uniquely "
+                "identifies this trigger. Do not edit manually."
+            ),
+        ),
+    ],
+    examples=[
+        NodeExample(
+            name="default",
+            data={"name": "Inbound Trigger", "enabled": True},
+        ),
+    ],
+    graph_constraints=GraphConstraints(
+        min_incoming=0,
+        max_incoming=0,
+    ),
+)
--- a/api/services/workflow/node_specs/webhook.py
+++ b/api/services/workflow/node_specs/webhook.py
@ -0,0 +1,135 @@
+"""Spec for the Webhook node — sends an HTTP request to an external system
+after the workflow completes."""
+
+from api.services.workflow.node_specs._base import (
+    NodeCategory,
+    NodeExample,
+    NodeSpec,
+    PropertyOption,
+    PropertySpec,
+    PropertyType,
+)
+
+SPEC = NodeSpec(
+    name="webhook",
+    display_name="Webhook",
+    description="Send HTTP request after the workflow completes.",
+    llm_hint=(
+        "Sends an HTTP request to an external system after the workflow "
+        "completes. The payload is a Jinja-templated JSON body with access "
+        "to `workflow_run_id`, `initial_context`, `gathered_context`, "
+        "`annotations`, and call metadata."
+    ),
+    category=NodeCategory.integration,
+    icon="Link2",
+    properties=[
+        PropertySpec(
+            name="name",
+            type=PropertyType.string,
+            display_name="Name",
+            description="Short identifier shown in the canvas and run logs.",
+            required=True,
+            min_length=1,
+            default="Webhook",
+        ),
+        PropertySpec(
+            name="enabled",
+            type=PropertyType.boolean,
+            display_name="Enabled",
+            description="When false, the webhook is skipped at run time.",
+            default=True,
+        ),
+        PropertySpec(
+            name="http_method",
+            type=PropertyType.options,
+            display_name="HTTP Method",
+            description="HTTP verb used for the outbound request.",
+            default="POST",
+            options=[
+                PropertyOption(value="GET", label="GET"),
+                PropertyOption(value="POST", label="POST"),
+                PropertyOption(value="PUT", label="PUT"),
+                PropertyOption(value="PATCH", label="PATCH"),
+                PropertyOption(value="DELETE", label="DELETE"),
+            ],
+        ),
+        PropertySpec(
+            name="endpoint_url",
+            type=PropertyType.url,
+            display_name="Endpoint URL",
+            description="URL the request is sent to.",
+            placeholder="https://api.example.com/webhook",
+        ),
+        PropertySpec(
+            name="credential_uuid",
+            type=PropertyType.credential_ref,
+            display_name="Authentication",
+            description="Optional credential applied as the Authorization header.",
+            llm_hint="Credential UUID from `list_credentials`.",
+        ),
+        PropertySpec(
+            name="custom_headers",
+            type=PropertyType.fixed_collection,
+            display_name="Custom Headers",
+            description="Additional HTTP headers to include with the request.",
+            properties=[
+                PropertySpec(
+                    name="key",
+                    type=PropertyType.string,
+                    display_name="Header Name",
+                    description="HTTP header name (e.g., 'X-Source').",
+                    required=True,
+                ),
+                PropertySpec(
+                    name="value",
+                    type=PropertyType.string,
+                    display_name="Header Value",
+                    description="Header value (supports {{template_variables}}).",
+                    required=True,
+                ),
+            ],
+        ),
+        PropertySpec(
+            name="payload_template",
+            type=PropertyType.json,
+            display_name="Payload Template",
+            description=(
+                "JSON body of the request. Values are Jinja-rendered against "
+                "the run context — `{{workflow_run_id}}`, "
+                "`{{gathered_context.foo}}`, `{{annotations.qa_xxx}}`, etc."
+            ),
+            default={
+                "call_id": "{{workflow_run_id}}",
+                "first_name": "{{initial_context.first_name}}",
+                "rsvp": "{{gathered_context.rsvp}}",
+                "duration": "{{cost_info.call_duration_seconds}}",
+                "recording_url": "{{recording_url}}",
+                "transcript_url": "{{transcript_url}}",
+            },
+        ),
+        PropertySpec(
+            name="retry_config",
+            type=PropertyType.json,
+            display_name="Retry Configuration",
+            description=(
+                "Optional retry settings: `enabled` (bool), `max_retries` "
+                "(int), `retry_delay_seconds` (int)."
+            ),
+        ),
+    ],
+    examples=[
+        NodeExample(
+            name="post_to_crm",
+            data={
+                "name": "Notify CRM",
+                "enabled": True,
+                "http_method": "POST",
+                "endpoint_url": "https://crm.example.com/calls",
+                "payload_template": {
+                    "run_id": "{{workflow_run_id}}",
+                    "outcome": "{{gathered_context.call_disposition}}",
+                },
+            },
+        ),
+    ],
+)
--- a/api/services/workflow/pipecat_engine.py
+++ b/api/services/workflow/pipecat_engine.py
@ -243,6 +243,7 @@ class PipecatEngine:
                            else 16000,
                            queue_frame=self._transport_output.queue_frame,
                            transcript=result.transcript,
+                            persist_to_logs=True,
                        )
                    else:
                        logger.warning(
@ -252,7 +253,11 @@ class PipecatEngine:
                    logger.info(f"Playing transition speech: {transition_speech}")
                    self._queued_speech_mute_state = "waiting"
                    await self.task.queue_frame(
-                        TTSSpeakFrame(transition_speech, append_to_context=False)
+                        TTSSpeakFrame(
+                            transition_speech,
+                            append_to_context=False,
+                            persist_to_logs=True,
+                        )
                    )

                # Set context for the new node, so that when the function call result
--- a/api/services/workflow/pipecat_engine_custom_tools.py
+++ b/api/services/workflow/pipecat_engine_custom_tools.py
@ -100,6 +100,7 @@ class CustomToolManager:
                        else 16000,
                        queue_frame=self._engine._transport_output.queue_frame,
                        transcript=result.transcript,
+                        persist_to_logs=True,
                    )
                    return True
                else:
@ -110,7 +111,11 @@ class CustomToolManager:
            custom_message = config.get("customMessage", "")
            if custom_message:
                await self._engine.task.queue_frame(
-                    TTSSpeakFrame(custom_message, append_to_context=append_to_context)
+                    TTSSpeakFrame(
+                        custom_message,
+                        append_to_context=append_to_context,
+                        persist_to_logs=True,
+                    )
                )
                return True

@ -311,6 +316,7 @@ class CustomToolManager:
                                else 16000,
                                queue_frame=self._engine._transport_output.queue_frame,
                                transcript=result.transcript,
+                                persist_to_logs=True,
                            )
                elif custom_message:
                    logger.info(
@ -318,7 +324,11 @@ class CustomToolManager:
                    )
                    self._engine._queued_speech_mute_state = "waiting"
                    await self._engine.task.queue_frame(
-                        TTSSpeakFrame(custom_message, append_to_context=False)
+                        TTSSpeakFrame(
+                            custom_message,
+                            append_to_context=False,
+                            persist_to_logs=True,
+                        )
                    )

                result = await execute_http_tool(
--- a/api/services/workflow/qa/analysis.py
+++ b/api/services/workflow/qa/analysis.py
@ -8,6 +8,7 @@ from loguru import logger
 from api.db.models import WorkflowRunModel
 from api.services.gen_ai.json_parser import parse_llm_json
 from api.services.pipecat.service_factory import create_llm_service_from_provider
+from api.services.workflow.dto import QANodeData
 from api.services.workflow.qa.conversation import (
    build_conversation_structure,
    format_transcript,
@ -77,7 +78,7 @@ async def _generate_conversation_summary(


 async def run_per_node_qa_analysis(
-    qa_node_data: dict[str, Any],
+    qa_data: QANodeData,
    workflow_run: WorkflowRunModel,
    workflow_run_id: int,
    workflow_definition: dict,
@ -106,18 +107,16 @@ async def run_per_node_qa_analysis(
        logger.info(
            f"Events lack node_id for run {workflow_run_id}, falling back to whole-call QA"
        )
-        return await _run_whole_call_qa_analysis(
-            qa_node_data, workflow_run, workflow_run_id
-        )
+        return await _run_whole_call_qa_analysis(qa_data, workflow_run, workflow_run_id)

-    system_prompt = qa_node_data.get("qa_system_prompt", "")
+    system_prompt = qa_data.qa_system_prompt or ""
    if not system_prompt:
        logger.warning("No system prompt defined for QA Node")
        return {"error": "no_system_prompt", "node_results": {}}

    # Resolve LLM config
    provider, model, api_key, service_kwargs = await resolve_llm_config(
-        qa_node_data, workflow_run
+        qa_data, workflow_run
    )
    if not api_key:
        logger.warning(
@ -127,7 +126,7 @@ async def run_per_node_qa_analysis(

    # Ensure node summaries
    node_summaries = await ensure_node_summaries(
-        workflow_definition, definition_id, workflow_run, qa_node_data
+        workflow_definition, definition_id, workflow_run, qa_data
    )

    # Set up Langfuse tracing
@ -228,7 +227,7 @@ async def run_per_node_qa_analysis(


 async def _run_whole_call_qa_analysis(
-    qa_node_data: dict[str, Any],
+    qa_data: QANodeData,
    workflow_run: WorkflowRunModel,
    workflow_run_id: int,
 ) -> dict[str, Any]:
@ -254,13 +253,13 @@ async def _run_whole_call_qa_analysis(
    metrics = compute_call_metrics(rtf_events, call_duration)

    # Resolve LLM config
-    system_prompt = qa_node_data.get("qa_system_prompt", "")
+    system_prompt = qa_data.qa_system_prompt or ""
    if not system_prompt:
        logger.warning("No system prompt defined for QA Node")
        return {"error": "no_system_prompt", "node_results": {}}

    provider, model, api_key, service_kwargs = await resolve_llm_config(
-        qa_node_data, workflow_run
+        qa_data, workflow_run
    )

    if not api_key:
--- a/api/services/workflow/qa/llm_config.py
+++ b/api/services/workflow/qa/llm_config.py
@ -4,10 +4,11 @@ import random

 from api.db import db_client
 from api.db.models import WorkflowRunModel
+from api.services.workflow.dto import QANodeData


 async def resolve_llm_config(
-    qa_node_data: dict, workflow_run: WorkflowRunModel
+    qa_data: QANodeData, workflow_run: WorkflowRunModel
 ) -> tuple[str, str, str, dict]:
    """Resolve the LLM provider, model, API key, and extra kwargs for QA analysis.

@ -18,24 +19,23 @@ async def resolve_llm_config(
        (provider, model, api_key, service_kwargs) tuple — service_kwargs can be
        passed directly to create_llm_service_from_provider as keyword arguments.
    """
-    if not qa_node_data.get("qa_use_workflow_llm", True):
-        provider = qa_node_data.get("qa_provider", "openai")
+    if not qa_data.qa_use_workflow_llm:
+        provider = qa_data.qa_provider or "openai"
        kwargs = {}
        if provider == "azure":
-            kwargs["endpoint"] = qa_node_data.get("qa_endpoint", "")
+            kwargs["endpoint"] = qa_data.qa_endpoint or ""
        return (
            provider,
-            qa_node_data.get("qa_model"),
-            qa_node_data.get("qa_api_key"),
+            qa_data.qa_model,
+            qa_data.qa_api_key,
            kwargs,
        )

    # Fall back to user's configured LLM
    provider, model, api_key, kwargs = await resolve_user_llm_config(workflow_run)

-    qa_model = qa_node_data.get("qa_model", "default")
-    if qa_model and qa_model != "default":
-        model = qa_model
+    if qa_data.qa_model and qa_data.qa_model != "default":
+        model = qa_data.qa_model

    return provider, model, api_key, kwargs

--- a/api/services/workflow/qa/node_summary.py
+++ b/api/services/workflow/qa/node_summary.py
@ -7,7 +7,7 @@ from loguru import logger
 from api.db import db_client
 from api.db.models import WorkflowRunModel
 from api.services.pipecat.service_factory import create_llm_service_from_provider
-from api.services.workflow.dto import NodeType
+from api.services.workflow.dto import NodeType, QANodeData
 from api.services.workflow.qa.llm_config import resolve_llm_config
 from api.services.workflow.qa.tracing import create_node_summary_trace
 from pipecat.processors.aggregators.llm_context import LLMContext
@ -48,7 +48,7 @@ async def ensure_node_summaries(
    workflow_definition: dict,
    definition_id: int | None,
    workflow_run: WorkflowRunModel,
-    qa_node_data: dict,
+    qa_data: QANodeData,
 ) -> dict[str, Any]:
    """Ensure every agentNode/startCall node has a summary in the definition.

@ -69,7 +69,7 @@ async def ensure_node_summaries(
        return existing_summaries

    provider, model, api_key, service_kwargs = await resolve_llm_config(
-        qa_node_data, workflow_run
+        qa_data, workflow_run
    )
    if not api_key:
        logger.warning("No API key for node summary generation, skipping")
--- a/api/services/workflow/tools/knowledge_base.py
+++ b/api/services/workflow/tools/knowledge_base.py
@ -242,7 +242,6 @@ async def _perform_retrieval(

            embedding_service = OpenAIEmbeddingService(
                db_client=db_client,
-                max_tokens=128,
                api_key=embeddings_api_key,
                model_id=embeddings_model or "text-embedding-3-small",
                base_url=embeddings_base_url,
--- a/api/services/workflow/workflow.py
+++ b/api/services/workflow/workflow.py
@ -2,7 +2,7 @@ import re
 from collections import Counter
 from typing import Dict, List, Set

-from api.services.workflow.dto import EdgeDataDTO, NodeDataDTO, NodeType, ReactFlowDTO
+from api.services.workflow.dto import EdgeDataDTO, NodeType, ReactFlowDTO
 from api.services.workflow.errors import ItemKind, WorkflowError

 # Regex for matching {{ variable }} template placeholders.
@ -61,32 +61,38 @@ class Edge:


 class Node:
-    def __init__(self, id: str, node_type: NodeType, data: NodeDataDTO):
+    def __init__(self, id: str, node_type: NodeType, data):
        self.id, self.node_type, self.data = id, node_type, data
        self.out: Dict[str, "Node"] = {}  # forward nodes
        self.out_edges: List[Edge] = []  # forward edges with properties

+        # name/is_start/is_end live on every per-type data class (base).
        self.name = data.name
-        self.prompt = data.prompt
-        self.is_static = data.is_static
        self.is_start = data.is_start
        self.is_end = data.is_end
-        self.allow_interrupt = data.allow_interrupt
-        self.extraction_enabled = data.extraction_enabled
-        self.extraction_prompt = data.extraction_prompt
-        self.extraction_variables = data.extraction_variables
-        self.add_global_prompt = data.add_global_prompt
-        self.greeting = data.greeting
-        self.greeting_type = data.greeting_type
-        self.greeting_recording_id = data.greeting_recording_id
-        self.detect_voicemail = data.detect_voicemail
-        self.delayed_start = data.delayed_start
-        self.delayed_start_duration = data.delayed_start_duration
-        self.tool_uuids = data.tool_uuids
-        self.document_uuids = data.document_uuids
-        self.pre_call_fetch_enabled = data.pre_call_fetch_enabled
-        self.pre_call_fetch_url = data.pre_call_fetch_url
-        self.pre_call_fetch_credential_uuid = data.pre_call_fetch_credential_uuid
+
+        # Type-specific fields — read with getattr so this works for every
+        # node variant in the discriminated union.
+        self.prompt = getattr(data, "prompt", None)
+        self.is_static = getattr(data, "is_static", False)
+        self.allow_interrupt = getattr(data, "allow_interrupt", False)
+        self.extraction_enabled = getattr(data, "extraction_enabled", False)
+        self.extraction_prompt = getattr(data, "extraction_prompt", None)
+        self.extraction_variables = getattr(data, "extraction_variables", None)
+        self.add_global_prompt = getattr(data, "add_global_prompt", True)
+        self.greeting = getattr(data, "greeting", None)
+        self.greeting_type = getattr(data, "greeting_type", None)
+        self.greeting_recording_id = getattr(data, "greeting_recording_id", None)
+        self.detect_voicemail = getattr(data, "detect_voicemail", False)
+        self.delayed_start = getattr(data, "delayed_start", False)
+        self.delayed_start_duration = getattr(data, "delayed_start_duration", None)
+        self.tool_uuids = getattr(data, "tool_uuids", None)
+        self.document_uuids = getattr(data, "document_uuids", None)
+        self.pre_call_fetch_enabled = getattr(data, "pre_call_fetch_enabled", False)
+        self.pre_call_fetch_url = getattr(data, "pre_call_fetch_url", None)
+        self.pre_call_fetch_credential_uuid = getattr(
+            data, "pre_call_fetch_credential_uuid", None
+        )

        self.data = data

@ -98,9 +104,11 @@ class WorkflowGraph:
    """

    def __init__(self, dto: ReactFlowDTO):
-        # build adjacency list
+        # build adjacency list. n.type comes off the discriminated-union
+        # variant as a literal string; coerce to NodeType for downstream
+        # comparisons.
        self.nodes: Dict[str, Node] = {
-            n.id: Node(n.id, n.type, n.data) for n in dto.nodes
+            n.id: Node(n.id, NodeType(n.type), n.data) for n in dto.nodes
        }

        # Store all edges
--- a/api/tasks/knowledge_base_processing.py
+++ b/api/tasks/knowledge_base_processing.py
@ -1,22 +1,22 @@
-"""ARQ background task for processing knowledge base documents."""
+"""ARQ background task for processing knowledge base documents.
+
+Document conversion and chunking live in the Model Proxy Service (MPS);
+this task downloads the file from S3, calls MPS, then handles the embedding
+and DB writes locally.
+"""

-import json
 import os
 import tempfile

-from docling.chunking import HybridChunker
-from docling.document_converter import DocumentConverter
-from docling_core.transforms.chunker.tokenizer.huggingface import HuggingFaceTokenizer
 from loguru import logger
-from transformers import AutoTokenizer

 from api.db import db_client
 from api.db.models import KnowledgeBaseChunkModel
 from api.services.gen_ai import OpenAIEmbeddingService
+from api.services.mps_service_key_client import mps_service_key_client
 from api.services.storage import storage_fs

-# For tokenization/chunking
-TOKENIZER_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
+MAX_FILE_SIZE_BYTES = 5 * 1024 * 1024


 async def process_knowledge_base_document(
@ -24,93 +24,84 @@ async def process_knowledge_base_document(
    document_id: int,
    s3_key: str,
    organization_id: int,
+    created_by_provider_id: str,
    max_tokens: int = 128,
    retrieval_mode: str = "chunked",
 ):
-    """Process a knowledge base document: download, chunk, embed, and store.
+    """Process a knowledge base document via MPS: download, call MPS, embed, store.

    Args:
        ctx: ARQ context
        document_id: Database ID of the document
        s3_key: S3 key where the file is stored
        organization_id: Organization ID
+        created_by_provider_id: Uploading user's provider ID (for OSS-mode auth to MPS)
        max_tokens: Maximum number of tokens per chunk (default: 128)
        retrieval_mode: "chunked" for vector search or "full_document" for full text
    """
    logger.info(
-        f"Starting knowledge base document processing for document_id={document_id}, "
-        f"s3_key={s3_key}, organization_id={organization_id}"
+        f"Processing knowledge base document: document_id={document_id}, "
+        f"s3_key={s3_key}, org={organization_id}, mode={retrieval_mode}"
    )

    temp_file_path = None

    try:
-        # Update status to processing
        await db_client.update_document_status(document_id, "processing")

-        # Extract file extension from S3 key
        filename = s3_key.split("/")[-1]
-        file_extension = (
-            os.path.splitext(filename)[1] or ".bin"
-        )  # Default to .bin if no extension
+        file_extension = os.path.splitext(filename)[1] or ".bin"

-        # Create temp file for download with correct extension
        temp_file = tempfile.NamedTemporaryFile(delete=False, suffix=file_extension)
        temp_file_path = temp_file.name
        temp_file.close()

-        # Download file from S3
        logger.info(f"Downloading file from S3: {s3_key}")
        download_success = await storage_fs.adownload_file(s3_key, temp_file_path)
-
        if not download_success:
            raise Exception(f"Failed to download file from S3: {s3_key}")
-
        if not os.path.exists(temp_file_path):
            raise FileNotFoundError(f"Downloaded file not found: {temp_file_path}")

        file_size = os.path.getsize(temp_file_path)
        logger.info(f"Downloaded file size: {file_size} bytes")

-        # Validate file size (max 5MB)
-        max_file_size = 5 * 1024 * 1024
-        if file_size > max_file_size:
-            error_message = f"File size ({file_size / (1024 * 1024):.1f}MB) exceeds the maximum allowed size of 5MB."
+        if file_size > MAX_FILE_SIZE_BYTES:
+            error_message = (
+                f"File size ({file_size / (1024 * 1024):.1f}MB) exceeds the "
+                f"maximum allowed size of {MAX_FILE_SIZE_BYTES // (1024 * 1024)}MB."
+            )
            logger.warning(f"Document {document_id}: {error_message}")
            await db_client.update_document_status(
                document_id, "failed", error_message=error_message
            )
            return

-        # Compute file hash and get mime type
        file_hash = db_client.compute_file_hash(temp_file_path)
        mime_type = db_client.get_mime_type(temp_file_path)
-        filename = s3_key.split("/")[-1]

-        # Get document record
        document = await db_client.get_document_by_id(document_id)
        if not document:
            raise Exception(f"Document {document_id} not found")

-        # Check if a document with this hash already exists (reject duplicates)
+        # Reject duplicates (same hash already ingested for this org).
        existing_doc = await db_client.get_document_by_hash(file_hash, organization_id)
        if existing_doc and existing_doc.id != document_id:
            error_message = (
                f"This file is a duplicate of '{existing_doc.filename}'. "
-                f"Please delete the duplicate files and consolidate them into a single unique file before uploading."
+                f"Please delete the duplicate files and consolidate them into a "
+                f"single unique file before uploading."
            )
            logger.warning(
-                f"Duplicate document detected: {document_id} is duplicate of {existing_doc.id} "
-                f"({existing_doc.filename})"
+                f"Duplicate document detected: {document_id} is duplicate of "
+                f"{existing_doc.id} ({existing_doc.filename})"
            )
-            # Update file metadata
            await db_client.update_document_metadata(
                document_id,
                file_size_bytes=file_size,
                file_hash=file_hash,
                mime_type=mime_type,
            )
-            # Mark as failed with duplicate error message
            await db_client.update_document_status(
                document_id,
                "failed",
@ -122,7 +113,6 @@ async def process_knowledge_base_document(
            )
            return

-        # Update document with file metadata
        await db_client.update_document_metadata(
            document_id,
            file_size_bytes=file_size,
@ -130,52 +120,35 @@ async def process_knowledge_base_document(
            mime_type=mime_type,
        )

-        # Full document mode: extract text and store it, skip chunking/embedding
+        logger.info(f"Delegating document processing to MPS (mode={retrieval_mode})")
+        mps_response = await mps_service_key_client.process_document(
+            file_path=temp_file_path,
+            filename=filename,
+            content_type=mime_type or "application/octet-stream",
+            retrieval_mode=retrieval_mode,
+            max_tokens=max_tokens,
+            organization_id=organization_id,
+            created_by=created_by_provider_id,
+        )
+
+        docling_metadata = mps_response.get("docling_metadata", {})
+
        if retrieval_mode == "full_document":
-            logger.info(f"Document {document_id}: full_document mode, extracting text")
-
-            plain_text_extensions = {".txt", ".json"}
-            if file_extension.lower() in plain_text_extensions:
-                with open(temp_file_path, "r", encoding="utf-8") as f:
-                    full_text = f.read()
-                if file_extension.lower() == ".json":
-                    try:
-                        parsed = json.loads(full_text)
-                        full_text = json.dumps(parsed, indent=2, ensure_ascii=False)
-                    except json.JSONDecodeError:
-                        pass
-                docling_metadata = {"document_type": "PlainText"}
-            else:
-                converter = DocumentConverter()
-                conversion_result = converter.convert(temp_file_path)
-                doc = conversion_result.document
-                full_text = doc.export_to_text()
-                docling_metadata = {
-                    "num_pages": len(doc.pages) if hasattr(doc, "pages") else None,
-                    "document_type": type(doc).__name__,
-                }
-
-            # Store full text on the document record
+            full_text = mps_response.get("full_text") or ""
            await db_client.update_document_full_text(document_id, full_text)
-
            await db_client.update_document_status(
                document_id,
                "completed",
                total_chunks=0,
                docling_metadata=docling_metadata,
            )
-
            logger.info(
                f"Successfully processed full_document {document_id}. "
                f"Text length: {len(full_text)} chars"
            )
            return

-        # Initialize the OpenAI embedding service
-        logger.info(
-            f"Initializing OpenAI embedding service with max_tokens={max_tokens}"
-        )
-        # Try to get user's embeddings configuration
+        # Chunked mode: fetch user embedding config, embed via OpenAI, persist chunks.
        embeddings_api_key = None
        embeddings_model = None
        embeddings_base_url = None
@ -187,7 +160,6 @@ async def process_knowledge_base_document(
                embeddings_base_url = getattr(user_config.embeddings, "base_url", None)
                logger.info(f"Using user embeddings config: model={embeddings_model}")

-        # Check if API key is configured
        if not embeddings_api_key:
            error_message = (
                "OpenAI API key not configured. Please set your API key in "
@ -199,190 +171,57 @@ async def process_knowledge_base_document(
            )
            return

-        service = OpenAIEmbeddingService(
+        embedding_service = OpenAIEmbeddingService(
            db_client=db_client,
-            max_tokens=max_tokens,
            api_key=embeddings_api_key,
            model_id=embeddings_model or "text-embedding-3-small",
            base_url=embeddings_base_url,
        )

-        # Step 1: Initialize tokenizer for chunking
-        logger.info(
-            f"Loading tokenizer: {TOKENIZER_MODEL} with max_tokens={max_tokens}"
-        )
-        hf_tokenizer = AutoTokenizer.from_pretrained(TOKENIZER_MODEL)
-        tokenizer = HuggingFaceTokenizer(
-            tokenizer=hf_tokenizer,
-            max_tokens=max_tokens,
-        )
+        mps_chunks = mps_response.get("chunks", [])
+        if not mps_chunks:
+            logger.warning(f"Document {document_id}: MPS returned zero chunks")

-        chunk_texts = []
        chunk_records = []
-        token_counts = []
-
-        # Check if file is a plain text format that docling doesn't support
-        plain_text_extensions = {".txt", ".json"}
-        if file_extension.lower() in plain_text_extensions:
-            # Read text content directly
-            logger.info(f"Reading {file_extension} file directly (bypassing docling)")
-            with open(temp_file_path, "r", encoding="utf-8") as f:
-                raw_content = f.read()
-
-            # For JSON files, pretty-print for better readability
-            if file_extension.lower() == ".json":
-                try:
-                    parsed = json.loads(raw_content)
-                    raw_content = json.dumps(parsed, indent=2, ensure_ascii=False)
-                except json.JSONDecodeError:
-                    logger.warning(
-                        "JSON file is not valid JSON, treating as plain text"
-                    )
-
-            docling_metadata = {
-                "num_pages": None,
-                "document_type": "PlainText",
-            }
-
-            # Token-based chunking for plain text
-            tokens = hf_tokenizer.encode(raw_content, add_special_tokens=False)
-            total_tokens = len(tokens)
-            logger.info(
-                f"Total tokens in file: {total_tokens}, chunking with max_tokens={max_tokens}"
+        chunk_texts = []
+        for chunk in mps_chunks:
+            contextualized = chunk.get("contextualized_text") or chunk["chunk_text"]
+            chunk_records.append(
+                KnowledgeBaseChunkModel(
+                    document_id=document_id,
+                    organization_id=organization_id,
+                    chunk_text=chunk["chunk_text"],
+                    contextualized_text=contextualized,
+                    chunk_index=chunk["chunk_index"],
+                    chunk_metadata=chunk.get("chunk_metadata") or {},
+                    embedding_model=embedding_service.get_model_id(),
+                    embedding_dimension=embedding_service.get_embedding_dimension(),
+                    token_count=chunk.get("token_count", 0),
+                )
            )
+            chunk_texts.append(contextualized)

-            start = 0
-            chunk_index = 0
-            while start < total_tokens:
-                end = min(start + max_tokens, total_tokens)
-                chunk_token_ids = tokens[start:end]
-                chunk_text = hf_tokenizer.decode(
-                    chunk_token_ids, skip_special_tokens=True
-                )
-
-                token_count = len(chunk_token_ids)
-                token_counts.append(token_count)
-
-                chunk_record = KnowledgeBaseChunkModel(
-                    document_id=document_id,
-                    organization_id=organization_id,
-                    chunk_text=chunk_text,
-                    contextualized_text=chunk_text,
-                    chunk_index=chunk_index,
-                    chunk_metadata={},
-                    embedding_model=service.get_model_id(),
-                    embedding_dimension=service.get_embedding_dimension(),
-                    token_count=token_count,
-                )
-
-                chunk_records.append(chunk_record)
-                chunk_texts.append(chunk_text)
-                chunk_index += 1
-                start = end
-
-            total_chunks = len(chunk_records)
-            logger.info(f"Generated {total_chunks} chunks from plain text")
-
-        else:
-            # Use docling for structured formats (PDF, DOCX, etc.)
-            logger.info("Converting document with docling")
-            converter = DocumentConverter()
-            conversion_result = converter.convert(temp_file_path)
-            doc = conversion_result.document
-
-            docling_metadata = {
-                "num_pages": len(doc.pages) if hasattr(doc, "pages") else None,
-                "document_type": type(doc).__name__,
-            }
-
-            # Initialize chunker
-            logger.info(f"Initializing HybridChunker with max_tokens={max_tokens}")
-            chunker = HybridChunker(tokenizer=tokenizer)
-
-            # Chunk the document
-            logger.info(f"Chunking document with max_tokens={max_tokens}")
-            chunks = list(chunker.chunk(dl_doc=doc))
-            total_chunks = len(chunks)
-            logger.info(f"Generated {total_chunks} chunks")
-
-            # Process each chunk
-            for i, chunk in enumerate(chunks):
-                chunk_text = chunk.text
-                contextualized_text = chunker.contextualize(chunk=chunk)
-
-                text_to_tokenize = (
-                    contextualized_text if contextualized_text else chunk_text
-                )
-                token_count = len(
-                    tokenizer.tokenizer.encode(
-                        text_to_tokenize, add_special_tokens=False
-                    )
-                )
-                token_counts.append(token_count)
-
-                chunk_metadata = {}
-                if hasattr(chunk, "meta") and chunk.meta:
-                    chunk_metadata = {
-                        "doc_items": (
-                            [str(item) for item in chunk.meta.doc_items]
-                            if hasattr(chunk.meta, "doc_items")
-                            else []
-                        ),
-                        "headings": (
-                            chunk.meta.headings
-                            if hasattr(chunk.meta, "headings")
-                            else []
-                        ),
-                    }
-
-                chunk_record = KnowledgeBaseChunkModel(
-                    document_id=document_id,
-                    organization_id=organization_id,
-                    chunk_text=chunk_text,
-                    contextualized_text=contextualized_text,
-                    chunk_index=i,
-                    chunk_metadata=chunk_metadata,
-                    embedding_model=service.get_model_id(),
-                    embedding_dimension=service.get_embedding_dimension(),
-                    token_count=token_count,
-                )
-
-                chunk_records.append(chunk_record)
-                chunk_texts.append(text_to_tokenize)
-
-        # Log chunk statistics
-        if token_counts:
-            avg_tokens = sum(token_counts) / len(token_counts)
-            min_tokens = min(token_counts)
-            max_tokens_actual = max(token_counts)
-            logger.info("Chunk token statistics:")
-            logger.info(f"  - Average: {avg_tokens:.1f} tokens")
-            logger.info(f"  - Min: {min_tokens} tokens")
-            logger.info(f"  - Max: {max_tokens_actual} tokens")
-
-        # Step 6: Generate embeddings using OpenAI
-        logger.info(f"Generating embeddings using {service.get_model_id()}")
-        embeddings = await service.embed_texts(chunk_texts)
-
-        # Step 7: Attach embeddings to chunk records
+        logger.info(
+            f"Generating embeddings for {len(chunk_texts)} chunks "
+            f"using {embedding_service.get_model_id()}"
+        )
+        embeddings = await embedding_service.embed_texts(chunk_texts)
        for chunk_record, embedding in zip(chunk_records, embeddings):
            chunk_record.embedding = embedding

-        # Step 8: Save chunks in database
        logger.info("Storing chunks in database")
        await db_client.create_chunks_batch(chunk_records)

-        # Step 9: Update document status to completed
        await db_client.update_document_status(
            document_id,
            "completed",
-            total_chunks=total_chunks,
+            total_chunks=len(chunk_records),
            docling_metadata=docling_metadata,
        )

        logger.info(
            f"Successfully processed knowledge base document {document_id}. "
-            f"Total chunks: {total_chunks}"
+            f"Total chunks: {len(chunk_records)}"
        )

    except Exception as e:
@ -390,14 +229,12 @@ async def process_knowledge_base_document(
            f"Error processing knowledge base document {document_id}: {e}",
            exc_info=True,
        )
-        # Update document status to failed
        await db_client.update_document_status(
            document_id, "failed", error_message=str(e)
        )
        raise

    finally:
-        # Clean up temp file
        if temp_file_path and os.path.exists(temp_file_path):
            try:
                os.remove(temp_file_path)
--- a/api/tasks/run_integrations.py
+++ b/api/tasks/run_integrations.py
@ -5,12 +5,19 @@ from typing import Any, Dict, Optional

 import httpx
 from loguru import logger
+from pydantic import ValidationError

 from api.constants import BACKEND_API_ENDPOINT
 from api.db import db_client
 from api.db.models import WorkflowRunModel
 from api.enums import OrganizationConfigurationKey
 from api.services.pipecat.tracing_config import register_org_langfuse_credentials
+from api.services.workflow.dto import (
+    QANodeData,
+    QARFNode,
+    WebhookNodeData,
+    WebhookRFNode,
+)
 from api.services.workflow.qa import run_per_node_qa_analysis
 from api.utils.credential_auth import build_auth_header
 from api.utils.template_renderer import render_template
@ -19,34 +26,34 @@ from pipecat.utils.run_context import set_current_org_id, set_current_run_id


 def _should_skip_qa(
-    node_data: dict,
+    qa_data: QANodeData,
    workflow_run: WorkflowRunModel,
 ) -> str | None:
    """Check whether QA analysis should be skipped for this call.

    Returns a reason string if the call should be skipped, or None if it should proceed.
    """
-    # Check minimum call duration
-    min_duration = node_data.get("qa_min_call_duration", 15)
    usage_info = workflow_run.usage_info or {}
    call_duration = usage_info.get("call_duration_seconds")
-    if call_duration is not None and call_duration < min_duration:
-        return f"call duration ({call_duration:.1f}s) below minimum ({min_duration}s)"
+    if call_duration is not None and call_duration < qa_data.qa_min_call_duration:
+        return (
+            f"call duration ({call_duration:.1f}s) below minimum "
+            f"({qa_data.qa_min_call_duration}s)"
+        )

-    # Check voicemail calls
-    qa_voicemail_calls = node_data.get("qa_voicemail_calls", False)
-    if not qa_voicemail_calls:
+    if not qa_data.qa_voicemail_calls:
        gathered_context = workflow_run.gathered_context or {}
        call_disposition = gathered_context.get("call_disposition", "")
        if call_disposition == EndTaskReason.VOICEMAIL_DETECTED.value:
            return "voicemail call and QA voicemail calls is disabled"

-    # Check sample rate
-    sample_rate = node_data.get("qa_sample_rate", 100)
-    if sample_rate < 100:
+    if qa_data.qa_sample_rate < 100:
        roll = random.randint(1, 100)
-        if roll > sample_rate:
-            return f"excluded by sampling ({sample_rate}% sample rate, rolled {roll})"
+        if roll > qa_data.qa_sample_rate:
+            return (
+                f"excluded by sampling ({qa_data.qa_sample_rate}% sample rate, "
+                f"rolled {roll})"
+            )

    return None

@ -66,15 +73,22 @@ async def _run_qa_nodes(
    results: Dict[str, Any] = {}

    for node in qa_nodes:
-        node_data = node.get("data", {})
        node_id = node.get("id", "unknown")
-        node_name = node_data.get("name", "QA Analysis")
+        try:
+            qa_node = QARFNode.model_validate(node)
+        except ValidationError as e:
+            logger.warning(f"QA node #{node_id} failed validation, skipping: {e}")
+            results[f"qa_{node_id}"] = {"error": "validation_failed"}
+            continue

-        if not node_data.get("qa_enabled", True):
+        qa_data = qa_node.data
+        node_name = qa_data.name
+
+        if not qa_data.qa_enabled:
            logger.debug(f"QA node '{node_name}' is disabled, skipping")
            continue

-        skip_reason = _should_skip_qa(node_data, workflow_run)
+        skip_reason = _should_skip_qa(qa_data, workflow_run)
        if skip_reason:
            logger.info(f"Skipping QA node '{node_name}' (#{node_id}): {skip_reason}")
            results[f"qa_{node_id}"] = {"skipped": True, "reason": skip_reason}
@ -83,7 +97,7 @@ async def _run_qa_nodes(
        try:
            logger.info(f"Running QA analysis for node '{node_name}' (#{node_id})")
            result = await run_per_node_qa_analysis(
-                node_data,
+                qa_data,
                workflow_run,
                workflow_run_id,
                workflow_definition,
@ -260,7 +274,16 @@ async def run_integrations_post_workflow_run(_ctx, workflow_run_id: int):

        # Step 8: Execute each webhook node
        for node in webhook_nodes:
-            webhook_data = node.get("data", {})
+            node_id = node.get("id", "unknown")
+            try:
+                webhook_node = WebhookRFNode.model_validate(node)
+            except ValidationError as e:
+                logger.warning(
+                    f"Webhook node #{node_id} failed validation, skipping: {e}"
+                )
+                continue
+
+            webhook_data = webhook_node.data
            try:
                await _execute_webhook_node(
                    webhook_data=webhook_data,
@ -268,10 +291,7 @@ async def run_integrations_post_workflow_run(_ctx, workflow_run_id: int):
                    organization_id=organization_id,
                )
            except Exception as e:
-                # Log error but continue with other webhooks
-                logger.warning(
-                    f"Failed to execute webhook '{webhook_data.get('name', 'unknown')}': {e}"
-                )
+                logger.warning(f"Failed to execute webhook '{webhook_data.name}': {e}")

    except Exception as e:
        logger.error(f"Error running integrations: {e}", exc_info=True)
@ -323,7 +343,7 @@ def _build_render_context(


 async def _execute_webhook_node(
-    webhook_data: Dict[str, Any],
+    webhook_data: WebhookNodeData,
    render_context: Dict[str, Any],
    organization_id: int,
 ) -> bool:
@ -331,31 +351,27 @@ async def _execute_webhook_node(
    Execute a single webhook node.

    Args:
-        webhook_data: The webhook node's data dict from workflow definition
+        webhook_data: The validated webhook node data
        render_context: Context for template rendering
        organization_id: For credential lookup

    Returns:
        True if successful, False otherwise
    """
-    webhook_name = webhook_data.get("name", "Unnamed Webhook")
+    webhook_name = webhook_data.name

-    # 1. Check if enabled
-    if not webhook_data.get("enabled", True):
+    if not webhook_data.enabled:
        logger.debug(f"Webhook '{webhook_name}' is disabled, skipping")
        return True

-    # 2. Validate endpoint URL
-    url = webhook_data.get("endpoint_url")
+    url = webhook_data.endpoint_url
    if not url:
        logger.warning(f"Webhook '{webhook_name}' has no endpoint URL")
        return False

-    # 3. Build headers
    headers = {"Content-Type": "application/json"}

-    # 4. Add auth header if credential configured
-    credential_uuid = webhook_data.get("credential_uuid")
+    credential_uuid = webhook_data.credential_uuid
    if credential_uuid:
        credential = await db_client.get_credential_by_uuid(
            credential_uuid, organization_id
@ -369,18 +385,13 @@ async def _execute_webhook_node(
                f"Credential {credential_uuid} not found for webhook '{webhook_name}'"
            )

-    # 5. Add custom headers
-    custom_headers = webhook_data.get("custom_headers", [])
-    for h in custom_headers:
-        if h.get("key") and h.get("value"):
-            headers[h["key"]] = h["value"]
+    for h in webhook_data.custom_headers or []:
+        if h.key and h.value:
+            headers[h.key] = h.value

-    # 6. Render payload template
-    payload_template = webhook_data.get("payload_template", {})
-    payload = render_template(payload_template, render_context)
+    payload = render_template(webhook_data.payload_template or {}, render_context)

-    # 7. Make HTTP request
-    method = webhook_data.get("http_method", "POST").upper()
+    method = (webhook_data.http_method or "POST").upper()

    logger.info(f"Executing webhook '{webhook_name}': {method}")

--- a/api/tests/conftest.py
+++ b/api/tests/conftest.py
@ -14,14 +14,17 @@ from unittest.mock import Mock
 import pytest

 from api.services.workflow.dto import (
+    AgentNodeData,
+    AgentRFNode,
    EdgeDataDTO,
+    EndCallNodeData,
+    EndCallRFNode,
    ExtractionVariableDTO,
-    NodeDataDTO,
-    NodeType,
    Position,
    ReactFlowDTO,
    RFEdgeDTO,
-    RFNodeDTO,
+    StartCallNodeData,
+    StartCallRFNode,
    VariableType,
 )
 from api.services.workflow.workflow import WorkflowGraph
@ -252,11 +255,10 @@ def simple_workflow() -> WorkflowGraph:
    """
    dto = ReactFlowDTO(
        nodes=[
-            RFNodeDTO(
+            StartCallRFNode(
                id="start",
-                type=NodeType.startNode,
                position=Position(x=0, y=0),
-                data=NodeDataDTO(
+                data=StartCallNodeData(
                    name="Start Call",
                    prompt=START_CALL_SYSTEM_PROMPT,
                    is_start=True,
@ -273,11 +275,10 @@ def simple_workflow() -> WorkflowGraph:
                    ],
                ),
            ),
-            RFNodeDTO(
+            EndCallRFNode(
                id="end",
-                type=NodeType.endNode,
                position=Position(x=0, y=200),
-                data=NodeDataDTO(
+                data=EndCallNodeData(
                    name="End Call",
                    prompt=END_CALL_SYSTEM_PROMPT,
                    is_end=True,
@ -317,11 +318,10 @@ def three_node_workflow() -> WorkflowGraph:
    """
    dto = ReactFlowDTO(
        nodes=[
-            RFNodeDTO(
+            StartCallRFNode(
                id="start",
-                type=NodeType.startNode,
                position=Position(x=0, y=0),
-                data=NodeDataDTO(
+                data=StartCallNodeData(
                    name="Start Call",
                    prompt=START_CALL_SYSTEM_PROMPT,
                    is_start=True,
@ -338,11 +338,10 @@ def three_node_workflow() -> WorkflowGraph:
                    ],
                ),
            ),
-            RFNodeDTO(
+            AgentRFNode(
                id="agent",
-                type=NodeType.agentNode,
                position=Position(x=0, y=200),
-                data=NodeDataDTO(
+                data=AgentNodeData(
                    name="Collect Info",
                    prompt=AGENT_SYSTEM_PROMPT,
                    allow_interrupt=False,
@ -358,11 +357,10 @@ def three_node_workflow() -> WorkflowGraph:
                    ],
                ),
            ),
-            RFNodeDTO(
+            EndCallRFNode(
                id="end",
-                type=NodeType.endNode,
                position=Position(x=0, y=400),
-                data=NodeDataDTO(
+                data=EndCallNodeData(
                    name="End Call",
                    prompt=END_CALL_SYSTEM_PROMPT,
                    is_end=True,
@ -411,11 +409,10 @@ def three_node_workflow_extraction_start_only() -> WorkflowGraph:
    """
    dto = ReactFlowDTO(
        nodes=[
-            RFNodeDTO(
+            StartCallRFNode(
                id="start",
-                type=NodeType.startNode,
                position=Position(x=0, y=0),
-                data=NodeDataDTO(
+                data=StartCallNodeData(
                    name="Start Call",
                    prompt=START_CALL_SYSTEM_PROMPT,
                    is_start=True,
@ -432,11 +429,10 @@ def three_node_workflow_extraction_start_only() -> WorkflowGraph:
                    ],
                ),
            ),
-            RFNodeDTO(
+            AgentRFNode(
                id="agent",
-                type=NodeType.agentNode,
                position=Position(x=0, y=200),
-                data=NodeDataDTO(
+                data=AgentNodeData(
                    name="Collect Info",
                    prompt=AGENT_SYSTEM_PROMPT,
                    allow_interrupt=False,
@ -444,11 +440,10 @@ def three_node_workflow_extraction_start_only() -> WorkflowGraph:
                    extraction_enabled=False,  # Explicitly disabled for testing
                ),
            ),
-            RFNodeDTO(
+            EndCallRFNode(
                id="end",
-                type=NodeType.endNode,
                position=Position(x=0, y=400),
-                data=NodeDataDTO(
+                data=EndCallNodeData(
                    name="End Call",
                    prompt=END_CALL_SYSTEM_PROMPT,
                    is_end=True,
@ -493,11 +488,10 @@ def three_node_workflow_no_variable_extraction() -> WorkflowGraph:
    """
    dto = ReactFlowDTO(
        nodes=[
-            RFNodeDTO(
+            StartCallRFNode(
                id="start",
-                type=NodeType.startNode,
                position=Position(x=0, y=0),
-                data=NodeDataDTO(
+                data=StartCallNodeData(
                    name="Start Call",
                    prompt=START_CALL_SYSTEM_PROMPT,
                    is_start=True,
@ -506,11 +500,10 @@ def three_node_workflow_no_variable_extraction() -> WorkflowGraph:
                    extraction_enabled=False,
                ),
            ),
-            RFNodeDTO(
+            AgentRFNode(
                id="agent",
-                type=NodeType.agentNode,
                position=Position(x=0, y=200),
-                data=NodeDataDTO(
+                data=AgentNodeData(
                    name="Collect Info",
                    prompt=AGENT_SYSTEM_PROMPT,
                    allow_interrupt=False,
@ -518,11 +511,10 @@ def three_node_workflow_no_variable_extraction() -> WorkflowGraph:
                    extraction_enabled=False,  # Explicitly disabled for testing
                ),
            ),
-            RFNodeDTO(
+            EndCallRFNode(
                id="end",
-                type=NodeType.endNode,
                position=Position(x=0, y=400),
-                data=NodeDataDTO(
+                data=EndCallNodeData(
                    name="End Call",
                    prompt=END_CALL_SYSTEM_PROMPT,
                    is_end=True,
--- a/api/tests/test_display_options_evaluator.py
+++ b/api/tests/test_display_options_evaluator.py
@ -0,0 +1,39 @@
+"""Golden-test parity for the display_options evaluator.
+
+Both the Python `evaluate_display_options` and the TypeScript
+`evaluateDisplayOptions` (in `ui/src/components/flow/renderer/displayOptions.ts`)
+must agree on every fixture in `display_options_fixtures.json`. The TS
+side is verified by `ui/scripts/test-display-options.mjs`.
+"""
+
+import json
+from pathlib import Path
+
+import pytest
+
+from api.services.workflow.node_specs import evaluate_display_options
+
+FIXTURES_PATH = (
+    Path(__file__).parent.parent
+    / "services"
+    / "workflow"
+    / "node_specs"
+    / "display_options_fixtures.json"
+)
+
+
+def load_cases():
+    with open(FIXTURES_PATH) as f:
+        return json.load(f)["cases"]
+
+
+@pytest.mark.parametrize("case", load_cases(), ids=lambda c: c["name"])
+def test_python_evaluator_matches_fixture(case):
+    rules = case["rules"]
+    values = case["values"]
+    expected = case["expected"]
+    actual = evaluate_display_options(rules, values)
+    assert actual is expected, (
+        f"{case['name']}: expected {expected}, got {actual} "
+        f"for rules={rules!r} values={values!r}"
+    )
--- a/api/tests/test_dograh_sdk.py
+++ b/api/tests/test_dograh_sdk.py
@ -0,0 +1,235 @@
+"""Tests for the Python runtime SDK (`dograh_sdk`).
+
+Uses a stub client backed by the in-process spec registry rather than
+exercising the HTTP layer — the HTTP client is a thin wrapper that's
+easier to test manually against a live server.
+
+Covers:
+- Workflow builder round-trips through ReactFlowDTO validation
+- Validation errors fail at the `add()` call site
+- from_json preserves node IDs and subsequent add() doesn't collide
+- Edge labels / conditions are required
+"""
+
+from __future__ import annotations
+
+from typing import Any
+
+import pytest
+from dograh_sdk import Workflow
+from dograh_sdk._generated_models import NodeSpec
+from dograh_sdk.errors import ValidationError
+
+from api.services.workflow.dto import ReactFlowDTO
+from api.services.workflow.node_specs import all_specs, get_spec
+
+
+class _StubClient:
+    """Stand-in for DograhClient backed by the in-process spec registry.
+    Matches the real client's contract: `get_node_type(name)` returns a
+    `NodeSpec` Pydantic model."""
+
+    def get_node_type(self, name: str) -> NodeSpec:
+        spec = get_spec(name)
+        if spec is None:
+            raise ValueError(f"Unknown spec: {name}")
+        return NodeSpec.model_validate(spec.model_dump(mode="json"))
+
+
+@pytest.fixture
+def client() -> _StubClient:
+    return _StubClient()
+
+
+# ─── Builder + to_json round-trip ────────────────────────────────────────
+
+
+def test_builds_minimal_workflow_and_roundtrips_through_dto(client: _StubClient):
+    wf = Workflow(client=client, name="minimal")
+    start = wf.add(
+        type="startCall",
+        name="greeting",
+        prompt="Say hi to the caller.",
+    )
+    end = wf.add(
+        type="endCall",
+        name="close",
+        prompt="Thank the caller and hang up.",
+    )
+    wf.edge(start, end, label="done", condition="When the greeting is complete")
+
+    payload = wf.to_json()
+    # Wire format must validate through the backend Pydantic union — if
+    # it doesn't, the SDK has silently drifted from the spec schema.
+    dto = ReactFlowDTO.model_validate(payload)
+    assert len(dto.nodes) == 2
+    assert {n.type for n in dto.nodes} == {"startCall", "endCall"}
+    assert len(dto.edges) == 1
+
+
+def test_defaults_applied_from_spec(client: _StubClient):
+    """Spec defaults (e.g., `allow_interrupt=False` on startCall) fill in
+    when the user doesn't pass them."""
+    wf = Workflow(client=client, name="defaults")
+    start = wf.add(type="startCall", name="greeting", prompt="hello")
+    payload = wf.to_json()
+    data = payload["nodes"][0]["data"]
+    assert data["allow_interrupt"] is False  # spec default
+    assert data["add_global_prompt"] is True  # spec default
+    _ = start  # used implicitly; silence unused
+
+
+def test_webhook_complex_fields_validate(client: _StubClient):
+    """Webhook's json + fixed_collection (custom_headers) round-trip."""
+    wf = Workflow(client=client, name="wh")
+    wh = wf.add(
+        type="webhook",
+        name="notify",
+        enabled=True,
+        http_method="POST",
+        endpoint_url="https://api.example.com/hook",
+        custom_headers=[{"key": "X-Source", "value": "dograh"}],
+        payload_template={"run": "{{workflow_run_id}}"},
+    )
+    payload = wf.to_json()
+    # Webhook has no incoming/outgoing graph requirements — render as a
+    # standalone node in the graph for the DTO round-trip.
+    ReactFlowDTO.model_validate(payload)
+    _ = wh
+
+
+# ─── Validation errors at call site ──────────────────────────────────────
+
+
+def test_unknown_field_raises_at_add(client: _StubClient):
+    wf = Workflow(client=client, name="typo")
+    with pytest.raises(ValidationError, match="unknown field"):
+        wf.add(
+            type="startCall",
+            name="greeting",
+            prompt="hi",
+            promt="typo",  # extra misspelled field
+        )
+
+
+def test_missing_required_raises_at_add(client: _StubClient):
+    wf = Workflow(client=client, name="missing")
+    with pytest.raises(ValidationError, match="required field missing"):
+        wf.add(type="startCall", name="greeting")  # no prompt
+
+
+def test_wrong_scalar_type_raises(client: _StubClient):
+    wf = Workflow(client=client, name="wrongtype")
+    with pytest.raises(ValidationError, match="expected boolean"):
+        wf.add(
+            type="agentNode",
+            name="x",
+            prompt="y",
+            allow_interrupt="yes",
+        )
+
+
+def test_invalid_options_value_raises(client: _StubClient):
+    wf = Workflow(client=client, name="wrongenum")
+    with pytest.raises(ValidationError, match="not in allowed"):
+        wf.add(
+            type="startCall",
+            name="greeting",
+            prompt="hi",
+            greeting_type="video",  # only text|audio allowed
+        )
+
+
+def test_unknown_node_type_raises(client: _StubClient):
+    wf = Workflow(client=client, name="x")
+    with pytest.raises(ValueError, match="Unknown spec"):
+        wf.add(type="nonExistentType", name="x")
+
+
+def test_validation_error_surfaces_llm_hint(client: _StubClient):
+    """When a property carries `llm_hint`, it appears in the error message
+    so LLMs can self-correct on retry. `tool_uuids` on agentNode has the
+    hint 'List of tool UUIDs from `list_tools`.'"""
+    wf = Workflow(client=client, name="hint")
+    with pytest.raises(ValidationError) as exc_info:
+        wf.add(
+            type="agentNode",
+            name="x",
+            prompt="y",
+            tool_uuids="single-uuid-not-a-list",  # wrong shape: str, not list
+        )
+    msg = str(exc_info.value)
+    assert "tool_uuids" in msg
+    assert "Hint:" in msg
+    assert "list_tools" in msg
+
+
+def test_no_hint_message_when_spec_has_none(client: _StubClient):
+    """Properties without `llm_hint` produce a plain error (no dangling
+    'Hint:' line)."""
+    wf = Workflow(client=client, name="no-hint")
+    with pytest.raises(ValidationError) as exc_info:
+        wf.add(type="agentNode", name="x", prompt="y", allow_interrupt="yes")
+    assert "Hint:" not in str(exc_info.value)
+
+
+def test_edge_requires_label_and_condition(client: _StubClient):
+    wf = Workflow(client=client, name="edge")
+    a = wf.add(type="startCall", name="a", prompt="hi")
+    b = wf.add(type="endCall", name="b", prompt="bye")
+    with pytest.raises(ValidationError, match="label is required"):
+        wf.edge(a, b, label="", condition="condition")
+    with pytest.raises(ValidationError, match="condition is required"):
+        wf.edge(a, b, label="label", condition="")
+
+
+# ─── Round-trip from_json → edit → to_json ────────────────────────────────
+
+
+def test_from_json_preserves_ids_and_next_id_doesnt_collide(client: _StubClient):
+    wf0 = Workflow(client=client, name="w0")
+    start = wf0.add(type="startCall", name="g", prompt="hi")
+    end = wf0.add(type="endCall", name="e", prompt="bye")
+    wf0.edge(start, end, label="done", condition="done")
+
+    payload = wf0.to_json()
+    wf1 = Workflow.from_json(payload, client=client, name="w0-reload")
+
+    # IDs are preserved
+    assert [n.id for n in wf1._nodes] == [start.id, end.id]
+    # Next add() gets a fresh ID, not colliding with the existing ones
+    new_ref = wf1.add(type="agentNode", name="qualify", prompt="ask stuff")
+    assert new_ref.id != start.id
+    assert new_ref.id != end.id
+    assert int(new_ref.id) > max(int(start.id), int(end.id))
+
+
+def test_from_json_validates_data(client: _StubClient):
+    """Loading a JSON payload with a misnamed field raises — we don't
+    silently accept drift."""
+    bad = {
+        "nodes": [
+            {
+                "id": "1",
+                "type": "startCall",
+                "position": {"x": 0, "y": 0},
+                "data": {"name": "g", "prompt": "hi", "bogus": 1},
+            }
+        ],
+        "edges": [],
+    }
+    with pytest.raises(ValidationError, match="unknown field"):
+        Workflow.from_json(bad, client=client)
+
+
+# ─── Sanity: all registered specs are reachable by name ───────────────────
+
+
+def test_every_registered_spec_is_reachable_by_sdk(client: _StubClient):
+    wf = Workflow(client=client, name="probe")
+    for spec in all_specs():
+        # Just fetch the spec via the client; doesn't add anything. This
+        # ensures the `_StubClient` wiring works for all types.
+        probe = client.get_node_type(spec.name)
+        assert probe.name == spec.name
+    _ = wf
--- a/api/tests/test_dograh_sdk_typed.py
+++ b/api/tests/test_dograh_sdk_typed.py
@ -0,0 +1,128 @@
+"""Tests for the typed SDK (`dograh_sdk.typed`).
+
+Covers:
+- Generated classes import cleanly and declare the correct spec name
+- `Workflow.add_typed(node)` produces the same wire format as
+  `Workflow.add(type=..., **kwargs)`
+- Typed-class construction respects required/optional field defaults
+"""
+
+from __future__ import annotations
+
+from typing import Any
+
+import pytest
+from dograh_sdk import Workflow
+from dograh_sdk._generated_models import NodeSpec
+from dograh_sdk.typed import (
+    AgentNode,
+    EndCall,
+    GlobalNode,
+    Qa,
+    StartCall,
+    Trigger,
+    TypedNode,
+    Webhook,
+)
+
+from api.services.workflow.dto import ReactFlowDTO
+from api.services.workflow.node_specs import get_spec
+
+
+class _StubClient:
+    def get_node_type(self, name: str) -> NodeSpec:
+        return NodeSpec.model_validate(get_spec(name).model_dump(mode="json"))
+
+
+@pytest.fixture
+def client() -> _StubClient:
+    return _StubClient()
+
+
+# ─── Generated classes declare the correct discriminator ──────────────────
+
+
+@pytest.mark.parametrize(
+    "cls,expected_type",
+    [
+        (StartCall, "startCall"),
+        (AgentNode, "agentNode"),
+        (EndCall, "endCall"),
+        (GlobalNode, "globalNode"),
+        (Trigger, "trigger"),
+        (Webhook, "webhook"),
+        (Qa, "qa"),
+    ],
+    ids=lambda v: v.__name__ if isinstance(v, type) else v,
+)
+def test_typed_class_declares_spec_name(cls: type[TypedNode], expected_type: str):
+    assert cls.type == expected_type
+    # Instances inherit the ClassVar
+    if cls is StartCall:
+        inst = cls(name="g", prompt="hi")
+    elif cls is AgentNode:
+        inst = cls(name="a", prompt="hi")
+    elif cls is EndCall:
+        inst = cls(name="e", prompt="hi")
+    elif cls is GlobalNode:
+        inst = cls(name="g", prompt="hi")
+    elif cls is Trigger:
+        inst = cls(name="t")
+    elif cls is Webhook:
+        inst = cls(name="wh")
+    else:  # Qa
+        inst = cls(name="qa")
+    assert inst.type == expected_type
+
+
+# ─── add_typed integrates with Workflow and round-trips through DTO ──────
+
+
+def test_add_typed_builds_valid_workflow(client: _StubClient):
+    wf = Workflow(client=client, name="typed-e2e")
+    start = wf.add_typed(StartCall(name="greeting", prompt="Hi there!"))
+    end = wf.add_typed(EndCall(name="done", prompt="Bye."))
+    wf.edge(start, end, label="done", condition="conversation over")
+
+    payload = wf.to_json()
+    dto = ReactFlowDTO.model_validate(payload)
+    assert len(dto.nodes) == 2
+    assert payload["nodes"][0]["type"] == "startCall"
+    assert payload["nodes"][1]["type"] == "endCall"
+
+
+def test_add_typed_and_add_produce_identical_data(client: _StubClient):
+    """The typed path and the generic path should produce identical node
+    data for equivalent inputs."""
+    wf_typed = Workflow(client=client)
+    wf_typed.add_typed(AgentNode(name="q", prompt="ask"))
+
+    wf_generic = Workflow(client=client)
+    wf_generic.add(type="agentNode", name="q", prompt="ask")
+
+    typed_data = wf_typed.to_json()["nodes"][0]["data"]
+    generic_data = wf_generic.to_json()["nodes"][0]["data"]
+    assert typed_data == generic_data
+
+
+def test_webhook_mutable_defaults_dont_share_state(client: _StubClient):
+    """Dataclass default_factory ensures every Webhook() gets its own dict."""
+    wf = Workflow(client=client)
+    a = wf.add_typed(Webhook(name="a"))
+    b = wf.add_typed(Webhook(name="b"))
+    payload = wf.to_json()
+    a_data = payload["nodes"][0]["data"]
+    b_data = payload["nodes"][1]["data"]
+    # Both instances must end up with payload_template populated from the
+    # factory; mutating one must not affect the other.
+    assert a_data["payload_template"] is not b_data["payload_template"]
+    _ = a, b
+
+
+def test_typed_sdk_surfaces_spec_default_to_field(client: _StubClient):
+    """Spec defaults make it all the way through: StartCall().name defaults
+    to the spec's `"Start Call"` literal."""
+    s = StartCall(prompt="hi")
+    assert s.name == "Start Call"
+    assert s.allow_interrupt is False  # matches spec default from earlier edits
+    assert s.add_global_prompt is True
--- a/api/tests/test_dto.py
+++ b/api/tests/test_dto.py
@ -1,11 +1,98 @@
+from pathlib import Path
+
 import pytest

-from api.services.workflow.dto import ReactFlowDTO
+from api.services.workflow.dto import ReactFlowDTO, sanitize_workflow_definition
+
+_FIXTURES_DIR = Path(__file__).parent / "definitions"


@pytest.mark.asyncio
 async def test_dto():
-    # assert no exceptions are raised
-    with open("tests/definitions/rf-1.json", "r") as f:
+    # Path resolved relative to this test file so the test works regardless
+    # of the cwd pytest is invoked from.
+    with open(_FIXTURES_DIR / "rf-1.json", "r") as f:
        dto = ReactFlowDTO.model_validate_json(f.read())
    assert dto is not None
+
+
+def test_sanitize_strips_ui_runtime_fields():
+    definition = {
+        "viewport": {"x": 0, "y": 0, "zoom": 1},
+        "nodes": [
+            {
+                "id": "n1",
+                "type": "startCall",
+                "position": {"x": 0, "y": 0},
+                "width": 200,  # ReactFlow-computed, preserved
+                "selected": True,  # ReactFlow runtime, preserved
+                "data": {
+                    "name": "Start",
+                    "prompt": "hi",
+                    "greeting": "hello",
+                    "invalid": True,  # UI-only, should be stripped
+                    "validationMessage": "oops",  # UI-only, should be stripped
+                    "mystery_field": 42,  # unknown, should be stripped
+                },
+            },
+            {
+                "id": "n2",
+                "type": "agentNode",
+                "position": {"x": 1, "y": 1},
+                "data": {"name": "A", "prompt": "p", "invalid": False},
+            },
+        ],
+        "edges": [
+            {
+                "id": "e1",
+                "source": "n1",
+                "target": "n2",
+                "data": {
+                    "label": "next",
+                    "condition": "true",
+                    "invalid": True,  # UI-only, should be stripped
+                },
+            }
+        ],
+    }
+
+    out = sanitize_workflow_definition(definition)
+
+    # Top-level keys preserved
+    assert out["viewport"] == {"x": 0, "y": 0, "zoom": 1}
+    # ReactFlow runtime fields on the node itself preserved
+    assert out["nodes"][0]["width"] == 200
+    assert out["nodes"][0]["selected"] is True
+
+    # node.data stripped of unknowns, known fields kept
+    n1_data = out["nodes"][0]["data"]
+    assert n1_data == {"name": "Start", "prompt": "hi", "greeting": "hello"}
+    assert "invalid" not in n1_data
+    assert "validationMessage" not in n1_data
+    assert "mystery_field" not in n1_data
+
+    n2_data = out["nodes"][1]["data"]
+    assert n2_data == {"name": "A", "prompt": "p"}
+
+    # edge.data stripped
+    assert out["edges"][0]["data"] == {"label": "next", "condition": "true"}
+
+
+def test_sanitize_noop_on_empty_and_unknown_types():
+    assert sanitize_workflow_definition(None) is None
+    assert sanitize_workflow_definition({}) == {}
+
+    # Unknown node type: pass through unchanged rather than wipe data
+    definition = {
+        "nodes": [
+            {
+                "id": "n1",
+                "type": "unknownType",
+                "position": {"x": 0, "y": 0},
+                "data": {"anything": "goes"},
+            }
+        ],
+        "edges": [],
+    }
+    out = sanitize_workflow_definition(definition)
+    assert out["nodes"][0]["data"] == {"anything": "goes"}
--- a/api/tests/test_layout.py
+++ b/api/tests/test_layout.py
@ -0,0 +1,124 @@
+"""Tests for position reconciliation after the LLM save round-trip."""
+
+from __future__ import annotations
+
+from api.services.workflow.layout import reconcile_positions
+
+
+def _node(
+    id: str,
+    type: str,
+    *,
+    name: str | None = None,
+    x: float = 0.0,
+    y: float = 0.0,
+) -> dict:
+    data: dict = {}
+    if name is not None:
+        data["name"] = name
+    return {"id": id, "type": type, "position": {"x": x, "y": y}, "data": data}
+
+
+def _edge(src: str, tgt: str) -> dict:
+    return {
+        "id": f"{src}-{tgt}",
+        "source": src,
+        "target": tgt,
+        "data": {"label": "x", "condition": "y"},
+    }
+
+
+def test_named_match_preserves_position():
+    previous = {
+        "nodes": [_node("99", "startCall", name="greeting", x=100, y=200)],
+        "edges": [],
+    }
+    new = {
+        "nodes": [_node("1", "startCall", name="greeting")],
+        "edges": [],
+    }
+    out = reconcile_positions(new, previous)
+    assert out["nodes"][0]["position"] == {"x": 100, "y": 200}
+
+
+def test_unnamed_match_by_type_ordering():
+    previous = {
+        "nodes": [
+            _node("7", "agentNode", x=-648, y=-158),
+            _node("8", "agentNode", x=500, y=-100),
+        ],
+        "edges": [],
+    }
+    new = {
+        "nodes": [
+            _node("1", "agentNode"),
+            _node("2", "agentNode"),
+        ],
+        "edges": [],
+    }
+    out = reconcile_positions(new, previous)
+    assert out["nodes"][0]["position"] == {"x": -648, "y": -158}
+    assert out["nodes"][1]["position"] == {"x": 500, "y": -100}
+
+
+def test_new_node_placed_relative_to_incoming_neighbor():
+    previous = {
+        "nodes": [_node("99", "startCall", name="greeting", x=100, y=200)],
+        "edges": [],
+    }
+    new = {
+        "nodes": [
+            _node("1", "startCall", name="greeting"),
+            _node("2", "agentNode", name="new_node"),
+        ],
+        "edges": [_edge("1", "2")],
+    }
+    out = reconcile_positions(new, previous)
+    # Start call keeps its previous position.
+    assert out["nodes"][0]["position"] == {"x": 100, "y": 200}
+    # New node offset from its incoming neighbor.
+    assert out["nodes"][1]["position"] == {"x": 500, "y": 400}
+
+
+def test_orphan_new_node_stays_at_origin():
+    new = {
+        "nodes": [_node("1", "agentNode", name="orphan")],
+        "edges": [],
+    }
+    out = reconcile_positions(new, None)
+    assert out["nodes"][0]["position"] == {"x": 0.0, "y": 0.0}
+
+
+def test_named_wins_over_unnamed_ordering():
+    previous = {
+        "nodes": [
+            _node("7", "agentNode", x=-648, y=-158),  # unnamed
+            _node("8", "agentNode", name="qualify", x=900, y=900),
+        ],
+        "edges": [],
+    }
+    new = {
+        "nodes": [
+            _node("1", "agentNode", name="qualify"),  # matches named
+            _node("2", "agentNode"),  # falls to unnamed queue
+        ],
+        "edges": [],
+    }
+    out = reconcile_positions(new, previous)
+    assert out["nodes"][0]["position"] == {"x": 900, "y": 900}
+    assert out["nodes"][1]["position"] == {"x": -648, "y": -158}
+
+
+def test_no_previous_keeps_origin_for_all_matched_positions():
+    new = {
+        "nodes": [
+            _node("1", "startCall", name="greeting"),
+            _node("2", "agentNode", name="reply"),
+        ],
+        "edges": [_edge("1", "2")],
+    }
+    out = reconcile_positions(new, None)
+    # No previous → first node stays at origin (no incoming), second
+    # node placed relative to its incoming neighbor at origin.
+    assert out["nodes"][0]["position"] == {"x": 0.0, "y": 0.0}
+    assert out["nodes"][1]["position"] == {"x": 400.0, "y": 200.0}
--- a/api/tests/test_mcp_save_workflow.py
+++ b/api/tests/test_mcp_save_workflow.py
@ -0,0 +1,225 @@
+"""Integration tests for the `save_workflow` MCP tool.
+
+Mocks `authenticate_mcp_request` and the db_client so tests don't need
+a live DB, but exercises the real TS validator subprocess end-to-end —
+parse is part of the contract the LLM relies on.
+
+Round-trip and pure-parser tests live in `test_ts_bridge.py`; this file
+focuses on the MCP tool's error-routing, version tagging, and DB-call
+shape.
+"""
+
+from __future__ import annotations
+
+import shutil
+from dataclasses import dataclass
+from unittest.mock import AsyncMock, MagicMock, patch
+
+import pytest
+from fastapi import HTTPException
+
+from api.mcp_server.tools.save_workflow import save_workflow
+
+pytestmark = pytest.mark.skipif(
+    shutil.which("node") is None, reason="node binary not available"
+)
+
+
+# ─── Fixtures & helpers ──────────────────────────────────────────────────
+
+
+@dataclass
+class _FakeDraft:
+    version_number: int = 2
+    status: str = "draft"
+
+
+class _FakeWorkflowModel:
+    id = 1
+    organization_id = 1
+    name = "test"
+    # reconcile_positions reads whichever of these holds the previous
+    # stored workflow JSON; None on all three is fine for a greenfield
+    # test and causes reconcile_positions to fall back to the placement
+    # heuristic for any new node.
+    current_definition = None
+    released_definition = None
+    workflow_definition = None
+
+
+@pytest.fixture
+def authed_user() -> MagicMock:
+    user = MagicMock()
+    user.selected_organization_id = 1
+    user.id = 1
+    return user
+
+
+@pytest.fixture
+def mock_backends(authed_user: MagicMock):
+    save_mock = AsyncMock(return_value=_FakeDraft())
+    update_mock = AsyncMock(return_value=_FakeWorkflowModel())
+    with (
+        patch(
+            "api.mcp_server.tools.save_workflow.authenticate_mcp_request",
+            AsyncMock(return_value=authed_user),
+        ),
+        patch(
+            "api.mcp_server.tools.save_workflow.db_client.get_workflow",
+            AsyncMock(return_value=_FakeWorkflowModel()),
+        ),
+        patch(
+            "api.mcp_server.tools.save_workflow.db_client.save_workflow_draft",
+            save_mock,
+        ),
+        patch(
+            "api.mcp_server.tools.save_workflow.db_client.update_workflow",
+            update_mock,
+        ),
+        patch(
+            "api.mcp_server.tools.save_workflow.db_client.get_draft_version",
+            AsyncMock(return_value=None),
+        ),
+    ):
+        yield save_mock, update_mock
+
+
+def _valid_code(name: str = "tool-test") -> str:
+    return f'''import {{ Workflow }} from "@dograh/sdk";
+import {{ startCall, endCall }} from "@dograh/sdk/typed";
+
+const wf = new Workflow({{ name: "{name}" }});
+
+const greeting = wf.addTyped(startCall({{ name: "greeting", prompt: "Hi!" }}));
+const done     = wf.addTyped(endCall({{ name: "done", prompt: "Bye." }}));
+
+wf.edge(greeting, done, {{ label: "done", condition: "conversation complete" }});
+'''
+
+
+# ─── Happy path ──────────────────────────────────────────────────────────
+
+
+@pytest.mark.asyncio
+async def test_happy_path_saves_draft(mock_backends):
+    save_mock, update_mock = mock_backends
+    # Match the stored name so the rename branch stays dormant here.
+    result = await save_workflow(
+        workflow_id=1, code=_valid_code(name=_FakeWorkflowModel.name)
+    )
+    assert result["saved"] is True
+    assert result["workflow_id"] == 1
+    assert result["version_number"] == 2
+    assert result["status"] == "draft"
+    assert result["node_count"] == 2
+    assert result["edge_count"] == 1
+    assert result["renamed"] is False
+    assert result["name"] == _FakeWorkflowModel.name
+    save_mock.assert_awaited_once()
+    update_mock.assert_not_awaited()
+    payload = save_mock.call_args.kwargs["workflow_definition"]
+    assert len(payload["nodes"]) == 2
+    assert len(payload["edges"]) == 1
+
+
+@pytest.mark.asyncio
+async def test_rename_propagates_to_update_workflow(mock_backends):
+    save_mock, update_mock = mock_backends
+    result = await save_workflow(workflow_id=1, code=_valid_code(name="renamed"))
+    assert result["saved"] is True
+    assert result["renamed"] is True
+    assert result["name"] == "renamed"
+    update_mock.assert_awaited_once()
+    kwargs = update_mock.call_args.kwargs
+    assert kwargs["workflow_id"] == 1
+    assert kwargs["name"] == "renamed"
+    assert kwargs["workflow_definition"] is None
+    assert kwargs["organization_id"] == 1
+    save_mock.assert_awaited_once()
+
+
+# ─── Parse-stage rejections ──────────────────────────────────────────────
+
+
+@pytest.mark.asyncio
+async def test_parser_rejects_disallowed_top_level(mock_backends):
+    save_mock, update_mock = mock_backends
+    code = _valid_code() + "function evil() { return 1; }\n"
+    result = await save_workflow(workflow_id=1, code=code)
+    assert result["saved"] is False
+    assert result["error_code"] == "parse_error"
+    save_mock.assert_not_awaited()
+    update_mock.assert_not_awaited()
+
+
+@pytest.mark.asyncio
+async def test_parser_rejects_unknown_factory(mock_backends):
+    save_mock, update_mock = mock_backends
+    code = """import { Workflow } from "@dograh/sdk";
+const wf = new Workflow({ name: "x" });
+const n = wf.addTyped(fakeNode({ name: "x", prompt: "y" }));
+"""
+    result = await save_workflow(workflow_id=1, code=code)
+    assert result["saved"] is False
+    assert result["error_code"] == "parse_error"
+    assert "Unknown node type" in result["error"]
+    save_mock.assert_not_awaited()
+    update_mock.assert_not_awaited()
+
+
+# ─── Validation-stage rejections ─────────────────────────────────────────
+
+
+@pytest.mark.asyncio
+async def test_unknown_field_surfaces_validation_error(mock_backends):
+    save_mock, update_mock = mock_backends
+    code = """import { Workflow } from "@dograh/sdk";
+import { startCall } from "@dograh/sdk/typed";
+const wf = new Workflow({ name: "x" });
+const n = wf.addTyped(startCall({ name: "g", prompt: "hi", promt: "typo" }));
+"""
+    result = await save_workflow(workflow_id=1, code=code)
+    assert result["saved"] is False
+    assert result["error_code"] == "validation_error"
+    assert "Unknown field" in result["error"]
+    save_mock.assert_not_awaited()
+    update_mock.assert_not_awaited()
+
+
+# ─── Graph-stage rejections ──────────────────────────────────────────────
+
+
+@pytest.mark.asyncio
+async def test_graph_validation_catches_missing_start_node(mock_backends):
+    save_mock, update_mock = mock_backends
+    # Only an end node — WorkflowGraph requires exactly one start node.
+    code = """import { Workflow } from "@dograh/sdk";
+import { endCall } from "@dograh/sdk/typed";
+const wf = new Workflow({ name: "orphan" });
+const only = wf.addTyped(endCall({ name: "only", prompt: "bye" }));
+"""
+    result = await save_workflow(workflow_id=1, code=code)
+    assert result["saved"] is False
+    assert result["error_code"] == "graph_validation"
+    save_mock.assert_not_awaited()
+    update_mock.assert_not_awaited()
+
+
+# ─── Workflow not found / unauthorized ───────────────────────────────────
+
+
+@pytest.mark.asyncio
+async def test_unknown_workflow_raises_404(authed_user: MagicMock):
+    with (
+        patch(
+            "api.mcp_server.tools.save_workflow.authenticate_mcp_request",
+            AsyncMock(return_value=authed_user),
+        ),
+        patch(
+            "api.mcp_server.tools.save_workflow.db_client.get_workflow",
+            AsyncMock(return_value=None),
+        ),
+    ):
+        with pytest.raises(HTTPException) as exc_info:
+            await save_workflow(workflow_id=999, code=_valid_code())
+        assert exc_info.value.status_code == 404
--- a/api/tests/test_node_specs.py
+++ b/api/tests/test_node_specs.py
@ -0,0 +1,196 @@
+"""Spec-quality lint.
+
+Catches drift between NodeSpecs and the rest of the system before it lands:
+- Placeholder/empty descriptions
+- Missing examples
+- display_options referencing fields that don't exist
+- Examples that don't validate against the per-type Pydantic DTO
+- Spec name not matching a discriminator value in dto.py
+"""
+
+from __future__ import annotations
+
+import re
+
+import pytest
+
+from api.services.workflow.dto import NodeType, ReactFlowDTO
+from api.services.workflow.node_specs import (
+    NodeSpec,
+    PropertySpec,
+    PropertyType,
+    all_specs,
+)
+
+PLACEHOLDER_DESCRIPTION_PATTERN = re.compile(
+    r"^\s*(todo|fixme|tbd|xxx|\.\.\.|placeholder|description|n/?a|\?)\s*\.?\s*$",
+    re.IGNORECASE,
+)
+
+
+def _walk_properties(props: list[PropertySpec], path: str = ""):
+    """Yield (full_path, property) for every property and nested sub-property."""
+    for prop in props:
+        full_path = f"{path}.{prop.name}" if path else prop.name
+        yield full_path, prop
+        if prop.properties:
+            yield from _walk_properties(prop.properties, full_path)
+
+
+# ─────────────────────────────────────────────────────────────────────────
+# Lint
+# ─────────────────────────────────────────────────────────────────────────
+
+
+@pytest.mark.parametrize("spec", all_specs(), ids=lambda s: s.name)
+def test_node_spec_has_non_placeholder_description(spec: NodeSpec):
+    assert spec.description.strip(), f"{spec.name}: empty description"
+    assert not PLACEHOLDER_DESCRIPTION_PATTERN.match(spec.description), (
+        f"{spec.name}: description looks like a placeholder: {spec.description!r}"
+    )
+    assert len(spec.description) >= 20, (
+        f"{spec.name}: description too short to be useful for an LLM "
+        f"({len(spec.description)} chars)"
+    )
+
+
+@pytest.mark.parametrize("spec", all_specs(), ids=lambda s: s.name)
+def test_node_spec_has_at_least_one_example(spec: NodeSpec):
+    assert spec.examples, (
+        f"{spec.name}: must have at least one NodeExample so LLMs have a "
+        f"realistic shape to pattern-match."
+    )
+
+
+@pytest.mark.parametrize("spec", all_specs(), ids=lambda s: s.name)
+def test_property_descriptions_non_placeholder(spec: NodeSpec):
+    for path, prop in _walk_properties(spec.properties):
+        assert prop.description.strip(), f"{spec.name}.{path}: empty description"
+        assert not PLACEHOLDER_DESCRIPTION_PATTERN.match(prop.description), (
+            f"{spec.name}.{path}: description looks like a placeholder: "
+            f"{prop.description!r}"
+        )
+
+
+@pytest.mark.parametrize("spec", all_specs(), ids=lambda s: s.name)
+def test_display_options_reference_real_fields(spec: NodeSpec):
+    """A property's display_options must only reference sibling property
+    names. Nested properties are scoped to their parent's siblings."""
+
+    def _check(scope_props: list[PropertySpec], scope_path: str = ""):
+        names_in_scope = {p.name for p in scope_props}
+        for prop in scope_props:
+            current_path = f"{scope_path}.{prop.name}" if scope_path else prop.name
+            if prop.display_options:
+                refs = set((prop.display_options.show or {}).keys()) | set(
+                    (prop.display_options.hide or {}).keys()
+                )
+                missing = refs - names_in_scope
+                assert not missing, (
+                    f"{spec.name}.{current_path}: display_options references "
+                    f"unknown sibling fields: {sorted(missing)}"
+                )
+            if prop.properties:
+                _check(prop.properties, current_path)
+
+    _check(spec.properties)
+
+
+@pytest.mark.parametrize("spec", all_specs(), ids=lambda s: s.name)
+def test_options_properties_have_options(spec: NodeSpec):
+    for path, prop in _walk_properties(spec.properties):
+        if prop.type in (PropertyType.options, PropertyType.multi_options):
+            assert prop.options, (
+                f"{spec.name}.{path}: type={prop.type.value} requires at "
+                f"least one PropertyOption."
+            )
+
+
+@pytest.mark.parametrize("spec", all_specs(), ids=lambda s: s.name)
+def test_fixed_collection_has_sub_properties(spec: NodeSpec):
+    for path, prop in _walk_properties(spec.properties):
+        if prop.type == PropertyType.fixed_collection:
+            assert prop.properties, (
+                f"{spec.name}.{path}: fixed_collection requires nested "
+                f"`properties` describing each row."
+            )
+
+
+@pytest.mark.parametrize("spec", all_specs(), ids=lambda s: s.name)
+def test_spec_name_matches_dto_discriminator(spec: NodeSpec):
+    valid_names = {t.value for t in NodeType}
+    assert spec.name in valid_names, (
+        f"NodeSpec {spec.name!r} doesn't match any NodeType discriminator. "
+        f"Valid: {sorted(valid_names)}"
+    )
+
+
+@pytest.mark.parametrize("spec", all_specs(), ids=lambda s: s.name)
+def test_examples_validate_against_dto(spec: NodeSpec):
+    """Each NodeExample.data must pass per-type DTO validation. This stops
+    examples from drifting away from the actual wire schema."""
+    for ex in spec.examples:
+        wire_node = {
+            "id": "example",
+            "type": spec.name,
+            "position": {"x": 0, "y": 0},
+            "data": ex.data,
+        }
+        # Build a minimal valid graph: example node plus a synthetic peer if
+        # graph_constraints require an incoming or outgoing edge.
+        nodes = [wire_node]
+        edges: list[dict] = []
+        constraints = spec.graph_constraints
+
+        if constraints and (constraints.min_outgoing or 0) > 0:
+            nodes.append(
+                {
+                    "id": "downstream",
+                    "type": "endCall",
+                    "position": {"x": 0, "y": 0},
+                    "data": {"name": "End", "prompt": "End", "is_end": True},
+                }
+            )
+            edges.append(
+                {
+                    "id": "e_out",
+                    "source": "example",
+                    "target": "downstream",
+                    "data": {"label": "next", "condition": "next"},
+                }
+            )
+
+        if constraints and (constraints.min_incoming or 0) > 0:
+            nodes.append(
+                {
+                    "id": "upstream",
+                    "type": "startCall",
+                    "position": {"x": 0, "y": 0},
+                    "data": {
+                        "name": "Start",
+                        "prompt": "Hello",
+                        "is_start": True,
+                    },
+                }
+            )
+            edges.append(
+                {
+                    "id": "e_in",
+                    "source": "upstream",
+                    "target": "example",
+                    "data": {"label": "in", "condition": "in"},
+                }
+            )
+
+        # Validate. If this raises, the example is broken.
+        ReactFlowDTO.model_validate({"nodes": nodes, "edges": edges})
+
+
+def test_all_dto_types_have_specs():
+    """Every NodeType discriminator value must have a registered NodeSpec —
+    catches the case where someone adds a new node type to dto.py but
+    forgets to author a spec."""
+    spec_names = {s.name for s in all_specs()}
+    type_values = {t.value for t in NodeType}
+    missing = type_values - spec_names
+    assert not missing, f"NodeType discriminators without specs: {sorted(missing)}"
--- a/api/tests/test_pipecat_engine_end_call.py
+++ b/api/tests/test_pipecat_engine_end_call.py
@ -27,12 +27,13 @@ import pytest
 from api.enums import ToolCategory
 from api.services.workflow.dto import (
    EdgeDataDTO,
-    NodeDataDTO,
-    NodeType,
+    EndCallNodeData,
+    EndCallRFNode,
    Position,
    ReactFlowDTO,
    RFEdgeDTO,
-    RFNodeDTO,
+    StartCallNodeData,
+    StartCallRFNode,
 )
 from api.services.workflow.pipecat_engine import PipecatEngine
 from api.services.workflow.pipecat_engine_custom_tools import CustomToolManager
@ -1013,11 +1014,10 @@ class TestEndCallExtractionBehavior:
        # Create a workflow where start node has NO extraction
        dto = ReactFlowDTO(
            nodes=[
-                RFNodeDTO(
+                StartCallRFNode(
                    id="start",
-                    type=NodeType.startNode,
                    position=Position(x=0, y=0),
-                    data=NodeDataDTO(
+                    data=StartCallNodeData(
                        name="Start Call",
                        prompt=START_CALL_SYSTEM_PROMPT,
                        is_start=True,
@ -1026,11 +1026,10 @@ class TestEndCallExtractionBehavior:
                        extraction_enabled=False,  # No extraction
                    ),
                ),
-                RFNodeDTO(
+                EndCallRFNode(
                    id="end",
-                    type=NodeType.endNode,
                    position=Position(x=0, y=200),
-                    data=NodeDataDTO(
+                    data=EndCallNodeData(
                        name="End Call",
                        prompt=END_CALL_SYSTEM_PROMPT,
                        is_end=True,
--- a/api/tests/test_sdk_sync.py
+++ b/api/tests/test_sdk_sync.py
@ -0,0 +1,99 @@
+"""Drift guard: committed SDK typed files must match what codegen
+produces from the current `node_specs/` registry.
+
+Fails loudly if a spec was edited without running
+`./scripts/generate_sdk.sh`. CI also runs the full script and asserts
+an empty `git diff` as the authoritative cross-language check; this
+test is the fast local feedback loop inside pytest.
+"""
+
+from __future__ import annotations
+
+import json
+import shutil
+import subprocess
+import sys
+from pathlib import Path
+
+import pytest
+
+# Ensure the Python SDK package is importable without requiring a
+# `pip install -e sdk/python`. The codegen lives there because it ships
+# with the SDK wheel, but tests need to reach it directly.
+REPO_ROOT = Path(__file__).resolve().parents[2]
+SDK_PY_SRC = REPO_ROOT / "sdk" / "python" / "src"
+if str(SDK_PY_SRC) not in sys.path:
+    sys.path.insert(0, str(SDK_PY_SRC))
+
+from dograh_sdk.codegen import generate_all  # noqa: E402
+
+from api.services.workflow.node_specs import SPEC_VERSION, all_specs  # noqa: E402
+
+PY_OUT = REPO_ROOT / "sdk" / "python" / "src" / "dograh_sdk" / "typed"
+TS_OUT = REPO_ROOT / "sdk" / "typescript" / "src" / "typed"
+TS_CODEGEN = REPO_ROOT / "sdk" / "typescript" / "scripts" / "codegen.mts"
+REGEN_HINT = "Run ./scripts/generate_sdk.sh to regenerate."
+
+
+def _specs_payload() -> dict:
+    return {
+        "spec_version": SPEC_VERSION,
+        "node_types": [s.model_dump(mode="json") for s in all_specs()],
+    }
+
+
+def _compare_trees(expected_dir: Path, actual_dir: Path, *, skip: set[str]) -> None:
+    def tree(d: Path) -> dict[str, str]:
+        return {
+            p.name: p.read_text()
+            for p in d.iterdir()
+            if p.is_file() and p.name not in skip
+        }
+
+    expected = tree(expected_dir)
+    actual = tree(actual_dir)
+
+    if expected.keys() != actual.keys():
+        pytest.fail(
+            f"File set differs in {expected_dir.name}/.\n"
+            f"  committed: {sorted(expected)}\n"
+            f"  generated: {sorted(actual)}\n"
+            f"{REGEN_HINT}"
+        )
+    for name in sorted(expected):
+        if expected[name] != actual[name]:
+            pytest.fail(
+                f"{expected_dir.name}/{name} is out of sync with node_specs. "
+                f"{REGEN_HINT}"
+            )
+
+
+def test_python_sdk_typed_in_sync(tmp_path: Path) -> None:
+    specs = _specs_payload()["node_types"]
+    generate_all(specs, tmp_path)
+    # _base.py is hand-written and lives alongside generated files.
+    _compare_trees(PY_OUT, tmp_path, skip={"_base.py", "__pycache__"})
+
+
+@pytest.mark.skipif(shutil.which("node") is None, reason="node binary not available")
+def test_typescript_sdk_typed_in_sync(tmp_path: Path) -> None:
+    specs_file = tmp_path / "specs.json"
+    specs_file.write_text(json.dumps(_specs_payload()))
+    out = tmp_path / "ts_out"
+
+    result = subprocess.run(
+        [
+            "node",
+            str(TS_CODEGEN),
+            "--input",
+            str(specs_file),
+            "--out",
+            str(out),
+        ],
+        capture_output=True,
+        text=True,
+    )
+    assert result.returncode == 0, (
+        f"TS codegen failed:\nstdout: {result.stdout}\nstderr: {result.stderr}"
+    )
+    _compare_trees(TS_OUT, out, skip=set())
--- a/api/tests/test_text_and_audio_playback.py
+++ b/api/tests/test_text_and_audio_playback.py
@ -15,12 +15,13 @@ import pytest
 from api.services.pipecat.recording_audio_cache import RecordingAudio
 from api.services.workflow.dto import (
    EdgeDataDTO,
-    NodeDataDTO,
-    NodeType,
+    EndCallNodeData,
+    EndCallRFNode,
    Position,
    ReactFlowDTO,
    RFEdgeDTO,
-    RFNodeDTO,
+    StartCallNodeData,
+    StartCallRFNode,
 )
 from api.services.workflow.pipecat_engine import PipecatEngine
 from api.services.workflow.pipecat_engine_custom_tools import CustomToolManager
@ -64,11 +65,10 @@ def text_workflow() -> WorkflowGraph:
    """Start->End workflow with text greeting and text transition speech."""
    dto = ReactFlowDTO(
        nodes=[
-            RFNodeDTO(
+            StartCallRFNode(
                id="start",
-                type=NodeType.startNode,
                position=Position(x=0, y=0),
-                data=NodeDataDTO(
+                data=StartCallNodeData(
                    name="Start Call",
                    prompt=START_PROMPT,
                    is_start=True,
@ -79,11 +79,10 @@ def text_workflow() -> WorkflowGraph:
                    extraction_enabled=False,
                ),
            ),
-            RFNodeDTO(
+            EndCallRFNode(
                id="end",
-                type=NodeType.endNode,
                position=Position(x=0, y=200),
-                data=NodeDataDTO(
+                data=EndCallNodeData(
                    name="End Call",
                    prompt=END_PROMPT,
                    is_end=True,
@ -115,11 +114,10 @@ def audio_workflow() -> WorkflowGraph:
    """Start->End workflow with audio greeting and audio transition speech."""
    dto = ReactFlowDTO(
        nodes=[
-            RFNodeDTO(
+            StartCallRFNode(
                id="start",
-                type=NodeType.startNode,
                position=Position(x=0, y=0),
-                data=NodeDataDTO(
+                data=StartCallNodeData(
                    name="Start Call",
                    prompt=START_PROMPT,
                    is_start=True,
@ -130,11 +128,10 @@ def audio_workflow() -> WorkflowGraph:
                    extraction_enabled=False,
                ),
            ),
-            RFNodeDTO(
+            EndCallRFNode(
                id="end",
-                type=NodeType.endNode,
                position=Position(x=0, y=200),
-                data=NodeDataDTO(
+                data=EndCallNodeData(
                    name="End Call",
                    prompt=END_PROMPT,
                    is_end=True,
@ -293,11 +290,10 @@ class TestStartGreeting:
        """No greeting configured should return None."""
        dto = ReactFlowDTO(
            nodes=[
-                RFNodeDTO(
+                StartCallRFNode(
                    id="start",
-                    type=NodeType.startNode,
                    position=Position(x=0, y=0),
-                    data=NodeDataDTO(
+                    data=StartCallNodeData(
                        name="Start",
                        prompt="Prompt",
                        is_start=True,
@ -305,11 +301,10 @@ class TestStartGreeting:
                        extraction_enabled=False,
                    ),
                ),
-                RFNodeDTO(
+                EndCallRFNode(
                    id="end",
-                    type=NodeType.endNode,
                    position=Position(x=0, y=200),
-                    data=NodeDataDTO(
+                    data=EndCallNodeData(
                        name="End",
                        prompt="End",
                        is_end=True,
@ -338,11 +333,10 @@ class TestStartGreeting:
        """Text greeting with {{variable}} placeholders should be rendered."""
        dto = ReactFlowDTO(
            nodes=[
-                RFNodeDTO(
+                StartCallRFNode(
                    id="start",
-                    type=NodeType.startNode,
                    position=Position(x=0, y=0),
-                    data=NodeDataDTO(
+                    data=StartCallNodeData(
                        name="Start",
                        prompt="Prompt",
                        is_start=True,
@ -352,11 +346,10 @@ class TestStartGreeting:
                        extraction_enabled=False,
                    ),
                ),
-                RFNodeDTO(
+                EndCallRFNode(
                    id="end",
-                    type=NodeType.endNode,
                    position=Position(x=0, y=200),
-                    data=NodeDataDTO(
+                    data=EndCallNodeData(
                        name="End",
                        prompt="End",
                        is_end=True,
--- a/api/tests/test_ts_bridge.py
+++ b/api/tests/test_ts_bridge.py
@ -0,0 +1,275 @@
+"""End-to-end tests for the Node TS validator bridge.
+
+Exercises the real `node` subprocess — slow-ish but the whole point is
+that code → JSON and JSON → code round-trip losslessly.
+"""
+
+from __future__ import annotations
+
+import shutil
+
+import pytest
+
+from api.mcp_server.ts_bridge import TsBridgeError, generate_code, parse_code
+
+pytestmark = pytest.mark.skipif(
+    shutil.which("node") is None, reason="node binary not available"
+)
+
+
+def _minimal_workflow() -> dict:
+    """Start → End, one edge. Stored shape matches ReactFlowDTO."""
+    return {
+        "nodes": [
+            {
+                "id": "1",
+                "type": "startCall",
+                "position": {"x": 0, "y": 0},
+                "data": {
+                    "name": "Greeting",
+                    "prompt": "Greet warmly.",
+                    "greeting_type": "text",
+                    "greeting": "Hi {{first_name}}!",
+                    "allow_interrupt": True,
+                },
+            },
+            {
+                "id": "2",
+                "type": "endCall",
+                "position": {"x": 200, "y": 0},
+                "data": {"name": "Done", "prompt": "Say goodbye."},
+            },
+        ],
+        "edges": [
+            {
+                "id": "1-2",
+                "source": "1",
+                "target": "2",
+                "data": {"label": "done", "condition": "conversation complete"},
+            },
+        ],
+        "viewport": {"x": 0, "y": 0, "zoom": 1},
+    }
+
+
+def _normalize(wf: dict) -> dict:
+    """Strip cosmetics before comparing a round-tripped workflow.
+
+    Node IDs are regenerated deterministically by the parser
+    (1, 2, 3, ...) so the inputs already match if constructed that way.
+    Position is preserved. Edge ids follow `source-target`.
+    """
+    return {
+        "nodes": [
+            {
+                "id": n["id"],
+                "type": n["type"],
+                "position": n["position"],
+                "data": n["data"],
+            }
+            for n in wf["nodes"]
+        ],
+        "edges": [
+            {
+                "id": e["id"],
+                "source": e["source"],
+                "target": e["target"],
+                "data": e["data"],
+            }
+            for e in wf["edges"]
+        ],
+    }
+
+
+# ─── generate_code ───────────────────────────────────────────────────────
+
+
+@pytest.mark.asyncio
+async def test_generate_emits_imports_and_factories():
+    code = await generate_code(_minimal_workflow(), workflow_name="test")
+    assert 'import { Workflow } from "@dograh/sdk";' in code
+    assert "startCall" in code
+    assert "endCall" in code
+    assert "wf.addTyped(startCall(" in code
+    assert "wf.edge(" in code
+
+
+@pytest.mark.asyncio
+async def test_generate_strips_spec_defaults():
+    wf = _minimal_workflow()
+    code = await generate_code(wf)
+    # `add_global_prompt=True` is a spec default for startCall; emitted
+    # code should omit it. Keeps the LLM-facing projection tight.
+    assert "add_global_prompt" not in code
+
+
+@pytest.mark.asyncio
+async def test_generate_omits_position():
+    """Positions are hidden from the LLM — auto-layout post-processing
+    (future) reassigns them on save. Keeping them out of the edit
+    surface avoids the LLM producing cramped/overlapping layouts."""
+    wf = _minimal_workflow()
+    code = await generate_code(wf)
+    assert "position" not in code
+
+
+@pytest.mark.asyncio
+async def test_generate_strips_legacy_ui_state_fields():
+    """Stored workflows from before spec validation carry UI-state fields
+    (`invalid`, `selected`, `is_start`, etc.). `get_workflow_code` hides
+    those from the LLM so edits don't round-trip the noise."""
+    wf = {
+        "nodes": [
+            {
+                "id": "1",
+                "type": "startCall",
+                "position": {"x": 0, "y": 0},
+                "data": {
+                    "name": "g",
+                    "prompt": "hi",
+                    "invalid": False,
+                    "validationMessage": None,
+                    "is_start": True,
+                    "selected": True,
+                    "dragging": False,
+                },
+            },
+        ],
+        "edges": [],
+        "viewport": {"x": 0, "y": 0, "zoom": 1},
+    }
+    code = await generate_code(wf)
+    for dropped in ("invalid", "validationMessage", "is_start", "selected", "dragging"):
+        assert dropped not in code, f"{dropped} should be stripped"
+    assert 'prompt: "hi"' in code
+
+
+@pytest.mark.asyncio
+async def test_generate_strips_unknown_edge_fields():
+    wf = _minimal_workflow()
+    wf["edges"][0]["data"]["invalid"] = False
+    wf["edges"][0]["data"]["validationMessage"] = None
+    code = await generate_code(wf)
+    assert "invalid" not in code
+    assert "validationMessage" not in code
+
+
+# ─── parse_code ──────────────────────────────────────────────────────────
+
+
+@pytest.mark.asyncio
+async def test_parse_accepts_minimal_code():
+    code = """import { Workflow } from "@dograh/sdk";
+import { startCall, endCall } from "@dograh/sdk/typed";
+
+const wf = new Workflow({ name: "min" });
+const a = wf.addTyped(startCall({ name: "g", prompt: "hi" }));
+const b = wf.addTyped(endCall({ name: "d", prompt: "bye" }));
+wf.edge(a, b, { label: "done", condition: "wrapped" });
+"""
+    result = await parse_code(code)
+    assert result["ok"] is True
+    wf = result["workflow"]
+    assert len(wf["nodes"]) == 2
+    assert len(wf["edges"]) == 1
+    assert wf["nodes"][0]["type"] == "startCall"
+    assert wf["edges"][0]["source"] == wf["nodes"][0]["id"]
+
+
+@pytest.mark.asyncio
+async def test_parse_rejects_function_declaration():
+    code = """import { Workflow } from "@dograh/sdk";
+const wf = new Workflow({ name: "x" });
+function evil() { return 1; }
+"""
+    result = await parse_code(code)
+    assert result["ok"] is False
+    assert result["stage"] == "parse"
+    assert any("FunctionDeclaration" in e["message"] for e in result["errors"])
+
+
+@pytest.mark.asyncio
+async def test_parse_rejects_unknown_field():
+    code = """import { Workflow } from "@dograh/sdk";
+import { startCall } from "@dograh/sdk/typed";
+const wf = new Workflow({ name: "x" });
+const a = wf.addTyped(startCall({ name: "g", prompt: "hi", promt: "typo" }));
+"""
+    result = await parse_code(code)
+    assert result["ok"] is False
+    assert result["stage"] == "validate"
+    assert any("Unknown field" in e["message"] for e in result["errors"])
+
+
+@pytest.mark.asyncio
+async def test_parse_rejects_unknown_variable_in_edge():
+    code = """import { Workflow } from "@dograh/sdk";
+import { startCall, endCall } from "@dograh/sdk/typed";
+const wf = new Workflow({ name: "x" });
+const a = wf.addTyped(startCall({ name: "g", prompt: "hi" }));
+wf.edge(a, missing, { label: "done", condition: "c" });
+"""
+    result = await parse_code(code)
+    assert result["ok"] is False
+    assert result["stage"] == "parse"
+    assert any("Unknown node variable" in e["message"] for e in result["errors"])
+
+
+@pytest.mark.asyncio
+async def test_parse_requires_label_and_condition_on_edge():
+    code = """import { Workflow } from "@dograh/sdk";
+import { startCall, endCall } from "@dograh/sdk/typed";
+const wf = new Workflow({ name: "x" });
+const a = wf.addTyped(startCall({ name: "g", prompt: "hi" }));
+const b = wf.addTyped(endCall({ name: "d", prompt: "bye" }));
+wf.edge(a, b, { label: "", condition: "c" });
+"""
+    result = await parse_code(code)
+    assert result["ok"] is False
+    assert result["stage"] == "parse"
+
+
+# ─── Round-trip ──────────────────────────────────────────────────────────
+
+
+@pytest.mark.asyncio
+async def test_round_trip_minimal():
+    wf = _minimal_workflow()
+    code = await generate_code(wf, workflow_name="rt")
+    result = await parse_code(code)
+    assert result["ok"] is True, result
+    # Positions are intentionally not preserved — they'll be reassigned
+    # by a downstream auto-layout pass. Parser defaults to {0, 0}.
+    for in_node, out_node in zip(wf["nodes"], result["workflow"]["nodes"]):
+        assert out_node["type"] == in_node["type"]
+        assert out_node["position"] == {"x": 0, "y": 0}
+        for k, v in in_node["data"].items():
+            assert out_node["data"][k] == v, (
+                f"{k}: {out_node['data'].get(k)!r} != {v!r}"
+            )
+    assert _normalize({"nodes": [], "edges": result["workflow"]["edges"]})["edges"] == [
+        {
+            "id": "1-2",
+            "source": "1",
+            "target": "2",
+            "data": {"label": "done", "condition": "conversation complete"},
+        }
+    ]
+
+
+@pytest.mark.asyncio
+async def test_generate_fails_on_unknown_type():
+    bad = {
+        "nodes": [
+            {
+                "id": "1",
+                "type": "doesNotExist",
+                "position": {"x": 0, "y": 0},
+                "data": {},
+            }
+        ],
+        "edges": [],
+        "viewport": {"x": 0, "y": 0, "zoom": 1},
+    }
+    with pytest.raises(TsBridgeError, match="Unknown node type"):
+        await generate_code(bad)
--- a/docs/docs.json
+++ b/docs/docs.json
@ -107,6 +107,7 @@
          },
          {
            "group": "Integrations",
+            "tag": "NEW",
            "pages": [
              "integrations/mcp"
            ]
@ -125,6 +126,15 @@
              "developer/environment-variables"
            ]
          },
+          {
+            "group": "SDKs",
+            "tag": "NEW",
+            "pages": [
+              "sdks/introduction",
+              "sdks/build-an-agent",
+              "sdks/outbound-calls"
+            ]
+          },
          {
            "group": "Deployment",
            "pages": [
@ -243,7 +253,7 @@
    }
  },
  "banner": {
-    "content": "🎉 **New: Gemini Live 3.1 Support** — Try the latest Google Gemini Live 3.1 on Dograh platform. [Learn more →](/configurations/inference-providers#gemini-3-1-live)",
+    "content": "🎉 **New: MCP Server & SDKs Released** — Drive Dograh from Claude, Cursor, or your own Python/TypeScript code. [MCP →](/integrations/mcp) · [SDKs →](/sdks/introduction)",
    "dismissible": true
  },
  "search": {
--- a/docs/integrations/mcp.mdx
+++ b/docs/integrations/mcp.mdx
@ -16,6 +16,16 @@ Dograh exposes an [MCP (Model Context Protocol)](https://modelcontextprotocol.io

 The endpoint is also shown in **Platform Settings → MCP Server** inside the Dograh UI.

+<Note>
+If you deployed Dograh to a remote server using [`setup_remote.sh`](/deployment/docker#option-2%3A-remote-server-deployment), your endpoint is served with a self-signed SSL certificate. Claude Code will refuse MCP connections to it unless you start the CLI with TLS verification disabled:
+
+```bash
+NODE_TLS_REJECT_UNAUTHORIZED=0 claude
+```
+
+This is only required for self-signed certificates. If you have set up a [custom domain](/deployment/custom-domain) with Let's Encrypt certificates via Certbot, no extra flag is needed.
+</Note>
+
 ## Claude Code

 Register Dograh as an MCP server with the Claude Code CLI:
@ -56,14 +66,33 @@ Restart Claude Desktop after saving. The Dograh tools should appear in the tool

 Any MCP client that supports Streamable HTTP transport can connect with the same URL and header. Paste the configuration above into your client's MCP settings file and replace `YOUR_API_KEY`.

-## Available tools
+## Example prompts

-Once connected, your AI assistant can:
+Once the MCP server is connected, you can drive Dograh from your coding agent in plain English. A few prompts to try:

- `list_workflows` — list agents in your workspace
- `get_workflow` — fetch an agent's definition by ID
- `search_dograh_docs` — search Dograh documentation
- `fetch_dograh_doc` — retrieve a specific doc page
+**Explore your workspace**
+
+- "List my agents in Dograh."
+- "Show me the definition of the agent called *Lead Qualifier*."
+- "Which credentials and tools are configured in my Dograh workspace?"
+- "List the recordings from my most recent agent."
+
+**Edit an agent**
+
+- "In my *Lead Qualifier* agent, add a new agent node after the greeting that asks the caller for their budget, then routes to the existing qualification node."
+- "Add an end-call node to *Support Bot* that triggers when the user says they are done, with a polite goodbye prompt."
+- "Rename the *intro* node in *Lead Qualifier* to *greeting* and update any edges that reference it."
+- "Change the LLM model on all agent nodes in *Support Bot* to `gpt-4o-mini`."
+
+**Learn the platform**
+
+- "Search the Dograh docs for how to configure a TURN server."
+- "What node types does Dograh support, and what fields does a `knowledge_base` node take?"
+- "How do I deploy Dograh on a custom domain with HTTPS?"
+
+<Note>
+Agent edits are saved as a new **draft** version — your published agent keeps serving calls until you explicitly publish the draft from the Dograh UI.
+</Note>

 <Note>
 The API key controls which workspace the assistant sees. Treat it like any other credential — do not commit it to source control or paste it into shared chats.
--- a/docs/sdks/build-an-agent.mdx
+++ b/docs/sdks/build-an-agent.mdx
@ -0,0 +1,111 @@
+---
+title: "Build an agent"
+description: "Assemble a Dograh voice agent programmatically with the SDK and save it as a draft"
+---
+
+The SDK mirrors the node-and-edge model of the [Voice Agent Builder](/voice-agent/introduction). You create a `Workflow`, add nodes (`startCall`, `agentNode`, `endCall`, …) with `add()`, connect them with `edge()`, and persist the result via `save_workflow`.
+
+## Prerequisites
+
+- A Dograh [API key](/configurations/api-keys) exported as `DOGRAH_API_KEY`
+- An existing agent ID to save drafts against (create one in the Dograh UI or via [`POST /api/v1/workflow/create`](/api-reference/agents/create-from-template))
+
+## Build and save
+
+The example below builds a three-node loan-qualification agent and saves it as a **new draft version** on an existing agent. Your published agent keeps serving calls until you explicitly publish the draft.
+
+<CodeGroup>
+```python Python
+from dograh_sdk import DograhClient, Workflow
+
+with DograhClient(api_key="YOUR_API_KEY") as client:
+    wf = Workflow(client=client, name="loan_qualification")
+
+    greeting = wf.add(
+        type="startCall",
+        name="greeting",
+        prompt="You are Sarah from Acme Loans. Greet the caller warmly.",
+    )
+    qualify = wf.add(
+        type="agentNode",
+        name="qualify",
+        prompt="Ask about loan amount, purpose, and monthly income.",
+    )
+    done = wf.add(
+        type="endCall",
+        name="done",
+        prompt="Thank them and end the call politely.",
+    )
+
+    wf.edge(greeting, qualify, label="interested", condition="Caller wants to continue.")
+    wf.edge(qualify, done, label="done", condition="All qualification questions answered.")
+
+    client.save_workflow(workflow_id=123, workflow=wf)
+```
+```typescript TypeScript
+import { DograhClient, Workflow } from "@dograh/sdk";
+
+const client = new DograhClient({ apiKey: "YOUR_API_KEY" });
+const wf = new Workflow({ client, name: "loan_qualification" });
+
+const greeting = await wf.add({
+    type: "startCall",
+    name: "greeting",
+    prompt: "You are Sarah from Acme Loans. Greet the caller warmly.",
+});
+const qualify = await wf.add({
+    type: "agentNode",
+    name: "qualify",
+    prompt: "Ask about loan amount, purpose, and monthly income.",
+});
+const done = await wf.add({
+    type: "endCall",
+    name: "done",
+    prompt: "Thank them and end the call politely.",
+});
+
+wf.edge(greeting, qualify, { label: "interested", condition: "Caller wants to continue." });
+wf.edge(qualify, done, { label: "done", condition: "All qualification questions answered." });
+
+await client.saveWorkflow(123, wf);
+```
+</CodeGroup>
+
+## Edit an existing agent
+
+Load an agent into an editable `Workflow`, mutate it, then save:
+
+<CodeGroup>
+```python Python
+wf = client.load_workflow(workflow_id=123)
+wf.name = "loan_qualification_v2"
+client.save_workflow(workflow_id=123, workflow=wf)
+```
+```typescript TypeScript
+const wf = await client.loadWorkflow(123);
+wf.name = "loan_qualification_v2";
+await client.saveWorkflow(123, wf);
+```
+</CodeGroup>
+
+## Discover node types
+
+Each node's `type` string and required fields come from the backend's node-spec catalog. Fetch it at runtime to validate what you can build:
+
+<CodeGroup>
+```python Python
+types = client.list_node_types()
+for spec in types.node_types:
+    print(spec.name, [p.name for p in spec.properties])
+```
+```typescript TypeScript
+const types = await client.listNodeTypes();
+for (const spec of types.node_types) {
+    console.log(spec.name, spec.properties.map(p => p.name));
+}
+```
+</CodeGroup>
+
+<Note>
+For a full description of each node type and its fields, see the [Nodes](/voice-agent/start-call) section of the Voice Agent Builder docs.
+</Note>
--- a/docs/sdks/introduction.mdx
+++ b/docs/sdks/introduction.mdx
@ -0,0 +1,75 @@
+---
+title: "Introduction"
+description: "Build and operate Dograh voice AI agents programmatically from Python or TypeScript"
+---
+
+Dograh ships official SDKs for **Python** and **TypeScript** that wrap the Dograh REST API and the workflow builder. Use them to create or edit agents, place outbound calls, and inspect runs from your own code.
+
+- **Python** — [`dograh-sdk`](https://pypi.org/project/dograh-sdk/) on PyPI
+- **TypeScript** — [`@dograh/sdk`](https://www.npmjs.com/package/@dograh/sdk) on npm
+
+Both packages are generated from the same backend OpenAPI spec, so the method surface is equivalent — only the naming convention differs (`snake_case` in Python, `camelCase` in TypeScript).
+
+## Install
+
+<CodeGroup>
+```bash Python
+pip install dograh-sdk
+```
+```bash TypeScript
+npm install @dograh/sdk
+```
+</CodeGroup>
+
+## Authenticate
+
+Generate an API key at [`/api-keys`](https://app.dograh.com/api-keys) (or `http://localhost:3010/api-keys` for self-hosted). See [API Keys](/configurations/api-keys) for details.
+
+Both SDKs read the API key from the `DOGRAH_API_KEY` environment variable by default, and the base URL from `DOGRAH_API_URL` (defaults to `http://localhost:8000`). You can also pass them explicitly.
+
+<CodeGroup>
+```python Python
+from dograh_sdk import DograhClient
+
+client = DograhClient(
+    base_url="https://app.dograh.com",
+    api_key="YOUR_API_KEY",
+)
+```
+```typescript TypeScript
+import { DograhClient } from "@dograh/sdk";
+
+const client = new DograhClient({
+    baseUrl: "https://app.dograh.com",
+    apiKey: "YOUR_API_KEY",
+});
+```
+</CodeGroup>
+
+<Note>
+For self-hosted deployments, swap `baseUrl` for your backend URL (e.g. `http://localhost:8000`).
+</Note>
+
+## Quick tour
+
+List the agents in your workspace:
+
+<CodeGroup>
+```python Python
+workflows = client.list_workflows()
+for wf in workflows:
+    print(wf.id, wf.name)
+```
+```typescript TypeScript
+const workflows = await client.listWorkflows();
+for (const wf of workflows) {
+    console.log(wf.id, wf.name);
+}
+```
+</CodeGroup>
+
+## Next steps
+
+- [Build an agent](/sdks/build-an-agent) — assemble nodes and edges, save as a draft
+- [Place an outbound call](/sdks/outbound-calls) — trigger a call from an agent to a phone number
+- [MCP Server](/integrations/mcp) — let Claude and other coding agents drive the SDK for you
--- a/docs/sdks/outbound-calls.mdx
+++ b/docs/sdks/outbound-calls.mdx
@ -0,0 +1,49 @@
+---
+title: "Place an outbound call"
+description: "Trigger a Dograh voice agent to call a phone number from the SDK"
+---
+
+Use the SDK to place a test outbound call from a specific agent to a phone number. This is the same endpoint used by the **Test Call** button in the Dograh UI.
+
+## Prerequisites
+
+- A Dograh [API key](/configurations/api-keys) exported as `DOGRAH_API_KEY`
+- A published agent (you need the agent ID)
+- A configured telephony provider — see [Telephony](/integrations/telephony/overview) for Twilio, Vonage, and other setups
+
+## Place the call
+
+<CodeGroup>
+```python Python
+from dograh_sdk import DograhClient
+from dograh_sdk._generated_models import InitiateCallRequest
+
+with DograhClient(api_key="YOUR_API_KEY") as client:
+    client.test_phone_call(
+        body=InitiateCallRequest(
+            workflow_id=123,
+            phone_number="+14155551234",
+        )
+    )
+```
+```typescript TypeScript
+import { DograhClient } from "@dograh/sdk";
+
+const client = new DograhClient({ apiKey: "YOUR_API_KEY" });
+
+await client.testPhoneCall({
+    body: {
+        workflow_id: 123,
+        phone_number: "+14155551234",
+    },
+});
+```
+</CodeGroup>
+
+## Inspect the run
+
+Every call creates a **run** you can inspect afterwards. See [Calls & runs](/core-concepts/calls-and-runs) for what's tracked, or use the [Runs API](/api-reference/agents/runs/list) to list and fetch runs programmatically.
+
+## Bulk campaigns
+
+For placing many calls at once (say, from a CSV), use [Campaigns](/core-concepts/campaigns) rather than looping over `test_phone_call` — campaigns handle pacing, retries, and progress tracking.
--- a/docs/voice-agent/pre-call-data-fetch.mdx
+++ b/docs/voice-agent/pre-call-data-fetch.mdx
@ -1,7 +1,6 @@
 ---
 title: "Pre-Call Data Fetch"
 description: "Fetch customer data from your CRM or ERP before the call starts, so your voice agent can greet callers by name and reference their account details."
-tag: "NEW"
 ---

 Pre-Call Data Fetch allows you to enrich the call context with external data before the voice agent starts speaking. When enabled on the **Start Call** node, Dograh sends an HTTP request to your API as soon as a call is initiated. While the response is loading, the caller hears a ring-back tone. Once the data arrives, it is merged into the call's [initial context](/core-concepts/context-and-variables#initial_context) and becomes available as template variables in your prompts and greetings.
--- a/docs/voice-agent/pre-recorded-audio.mdx
+++ b/docs/voice-agent/pre-recorded-audio.mdx
@ -1,7 +1,6 @@
 ---
 title: "Pre-recorded Audio"
 description: "Build hybrid voice agents that combine pre-recorded audio with dynamic text generation for lower latency, reduced TTS costs, and natural-sounding conversations."
-tag: "NEW"
 ---

 Custom recordings allow you to build **hybrid voice agents** that use your own pre-recorded audio for key parts of the conversation, while falling back to LLM-generated speech (via a cloned voice) for dynamic responses. This gives you the best of both worlds — the emotional depth of real human speech and the flexibility of AI-generated dialogue.
--- a/2
+++ b/2
@ -1 +1 @@
-Subproject commit edefaad42b97e52a3ad5eef8d15115a5c6ba3b11
+Subproject commit a6869df4bc7de8bd14f0533f7112f7d6a24891d9
--- a/scripts/generate_sdk.sh
+++ b/scripts/generate_sdk.sh
@ -0,0 +1,109 @@
+#!/usr/bin/env bash
+# Regenerate every file the SDKs derive from authoritative backend state:
+#
+#   1. Typed node dataclasses / TS interfaces (from node_specs registry)
+#   2. Filtered OpenAPI spec (routes tagged via @sdk_expose)
+#   3. Pydantic request/response models + TS interfaces (datamodel-codegen
+#      / openapi-typescript)
+#   4. Client method mixins (_generated_client.py / _generated_client.ts)
+#
+# Run from anywhere — the script resolves the repo root relative to itself.
+# Requires:
+#   - `python` in the `dograh` conda env, `api/.env` sourced; the `api`
+#     package must be importable. `datamodel-code-generator` installed
+#     (`pip install datamodel-code-generator`).
+#   - `node` (>= 22.6 for native .mts support) and npm. openapi-typescript
+#     is a devDependency of sdk/typescript; `npm install` in that dir is
+#     done for you if node_modules is missing.
+#
+# Invoked manually after editing any NodeSpec or after adding/removing an
+# `@sdk_expose` decorator. CI runs this and asserts the git diff is empty.
+
+set -euo pipefail
+
+REPO_ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
+cd "$REPO_ROOT"
+
+if [ -f "$REPO_ROOT/api/.env" ]; then
+    set -a
+    # shellcheck disable=SC1091
+    source "$REPO_ROOT/api/.env"
+    set +a
+fi
+
+SPECS_JSON="$(mktemp -t dograh-specs-XXXXXX.json)"
+OPENAPI_JSON="$(mktemp -t dograh-openapi-XXXXXX.json)"
+trap 'rm -f "$SPECS_JSON" "$OPENAPI_JSON"' EXIT
+
+# ── 1. Node-spec typed dataclasses ────────────────────────────────────
+
+echo "→ Dumping node specs from in-process registry..."
+python -m api.services.workflow.node_specs > "$SPECS_JSON"
+
+echo "→ Generating Python typed dataclasses..."
+PYTHONPATH="$REPO_ROOT/sdk/python/src" python -m dograh_sdk.codegen \
+    --input "$SPECS_JSON" \
+    --out "sdk/python/src/dograh_sdk/typed"
+
+echo "→ Generating TypeScript typed interfaces..."
+node "sdk/typescript/scripts/codegen.mts" \
+    --input "$SPECS_JSON" \
+    --out "sdk/typescript/src/typed"
+
+# ── 2. SDK-scoped OpenAPI spec ────────────────────────────────────────
+
+echo "→ Dumping filtered OpenAPI (sdk_expose routes only)..."
+python - <<PY
+import json
+from loguru import logger
+logger.remove()
+from fastapi.openapi.utils import get_openapi
+from api.app import app
+
+sdk_routes = [
+    r for r in app.routes
+    if getattr(r, "openapi_extra", None)
+    and "x-sdk-method" in (r.openapi_extra or {})
+]
+spec = get_openapi(title=app.title, version=app.version, routes=sdk_routes)
+with open("$OPENAPI_JSON", "w") as f:
+    json.dump(spec, f)
+print(f"  → {len(sdk_routes)} operations, "
+      f"{len(spec.get('components', {}).get('schemas', {}))} schemas reachable")
+PY
+
+# ── 3. Request/response models (off-the-shelf) ────────────────────────
+
+echo "→ Generating Python Pydantic models (datamodel-codegen)..."
+datamodel-codegen \
+    --input "$OPENAPI_JSON" \
+    --input-file-type openapi \
+    --output "sdk/python/src/dograh_sdk/_generated_models.py" \
+    --output-model-type pydantic_v2.BaseModel \
+    --target-python-version 3.10 \
+    --use-schema-description \
+    --use-field-description \
+    --use-annotated \
+    --use-union-operator \
+    --field-constraints \
+    --wrap-string-literal
+
+echo "→ Generating TypeScript types (openapi-typescript)..."
+if [ ! -d "sdk/typescript/node_modules" ]; then
+    (cd sdk/typescript && npm install --silent)
+fi
+(cd sdk/typescript && npx --no-install openapi-typescript \
+    "$OPENAPI_JSON" \
+    --output "src/_generated_models.ts" \
+    --root-types \
+    --root-types-no-schema-prefix)
+
+# ── 4. Client method mixins ──────────────────────────────────────────
+
+echo "→ Emitting client method mixins..."
+python -m sdk.codegen.client_codegen \
+    --input "$OPENAPI_JSON" \
+    --py-out "sdk/python/src/dograh_sdk/_generated_client.py" \
+    --ts-out "sdk/typescript/src/_generated_client.ts"
+
+echo "✓ SDK regenerated."
--- a/scripts/release_sdks.sh
+++ b/scripts/release_sdks.sh
@ -0,0 +1,123 @@
+#!/usr/bin/env bash
+# Cut a release of both SDKs — dograh-sdk (PyPI) and @dograh/sdk (npm) —
+# at the given version. Regenerates typed files from node_specs first so
+# a stale SDK can't ship.
+#
+# Usage:
+#   ./scripts/release_sdks.sh 0.1.2
+#
+# Prerequisites (one-time setup):
+#   - `build` + `twine` installed: `pip install --upgrade build twine`
+#   - `npm login` completed as a member of the `dograh` npm org. npm
+#     publish will prompt interactively for a 2FA OTP — run this script
+#     in a terminal where you can type the code.
+#
+# The script is idempotent up to the upload steps: each publish is gated
+# by a y/N prompt, so you can dry-run the build and bail before anything
+# hits a registry.
+
+set -euo pipefail
+
+VERSION="${1:-}"
+if [[ -z "$VERSION" ]]; then
+    echo "usage: $0 <version>   # e.g. 0.1.2" >&2
+    exit 1
+fi
+if ! [[ "$VERSION" =~ ^[0-9]+\.[0-9]+\.[0-9]+([.\-][A-Za-z0-9.]+)?$ ]]; then
+    echo "error: '$VERSION' does not look like semver (e.g. 0.1.2 or 0.2.0-rc.1)" >&2
+    exit 1
+fi
+
+REPO_ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
+cd "$REPO_ROOT"
+
+confirm() {
+    local reply
+    read -r -p "$1 [y/N] " reply
+    [[ "$reply" =~ ^[Yy]$ ]]
+}
+
+echo "→ Regenerating typed SDK sources from node_specs..."
+./scripts/generate_sdk.sh
+
+if ! git diff --quiet -- sdk/python/src/dograh_sdk/typed sdk/typescript/src/typed; then
+    echo
+    echo "⚠  node_specs regeneration changed typed files. Review the diff"
+    echo "   above and commit before releasing — otherwise the tag will"
+    echo "   point at a tree that disagrees with what ships to the registry."
+    if ! confirm "Continue anyway?"; then
+        exit 1
+    fi
+fi
+
+echo "→ Bumping versions to $VERSION..."
+VERSION="$VERSION" python - <<'PY'
+import os
+import pathlib
+import re
+
+version = os.environ["VERSION"]
+
+py = pathlib.Path("sdk/python/pyproject.toml")
+py.write_text(
+    re.sub(r'^version = "[^"]+"', f'version = "{version}"', py.read_text(), count=1, flags=re.M)
+)
+
+ts = pathlib.Path("sdk/typescript/package.json")
+ts.write_text(
+    re.sub(r'"version": "[^"]+"', f'"version": "{version}"', ts.read_text(), count=1)
+)
+
+print(f"  pyproject.toml → {version}")
+print(f"  package.json  → {version}")
+PY
+
+echo "→ Building Python wheel + sdist..."
+(
+    cd sdk/python
+    rm -rf dist build
+    python -m build >/dev/null
+    twine check dist/*
+)
+
+echo "→ Building TypeScript + running tests..."
+(
+    cd sdk/typescript
+    rm -rf dist
+    npm ci --silent
+    npm run build
+    npm test
+)
+
+echo
+echo "============================================================"
+echo "  Built dograh-sdk==$VERSION and @dograh/sdk@$VERSION"
+echo "  Nothing has been published yet."
+echo "============================================================"
+echo
+
+if confirm "Upload dograh-sdk==$VERSION to TestPyPI first (recommended)?"; then
+    (cd sdk/python && twine upload --repository testpypi dist/*)
+    echo "  → https://test.pypi.org/project/dograh-sdk/$VERSION/"
+    echo
+fi
+
+if confirm "Upload dograh-sdk==$VERSION to PyPI?"; then
+    (cd sdk/python && twine upload dist/*)
+    echo "  → https://pypi.org/project/dograh-sdk/$VERSION/"
+    echo
+fi
+
+if confirm "Publish @dograh/sdk@$VERSION to npm? (will prompt for 2FA OTP)"; then
+    (cd sdk/typescript && npm publish --access public)
+    echo "  → https://www.npmjs.com/package/@dograh/sdk/v/$VERSION"
+    echo
+fi
+
+if confirm "Create annotated git tag sdks-v$VERSION at HEAD?"; then
+    git tag -a "sdks-v$VERSION" -m "dograh-sdk + @dograh/sdk $VERSION"
+    echo "  → created tag (not pushed). Push with:"
+    echo "     git push origin sdks-v$VERSION"
+fi
+
+echo "✓ Done."
--- a/sdk/codegen/init.py
+++ b/sdk/codegen/init.py
--- a/sdk/codegen/client_codegen.py
+++ b/sdk/codegen/client_codegen.py
@ -0,0 +1,355 @@
+"""Generate SDK client mixins (Python + TypeScript) from a filtered OpenAPI dump.
+
+Input: a spec produced by calling FastAPI's `get_openapi(routes=...)` with
+only the routes tagged via `sdk_expose(...)`. Because it's already filtered,
+this script does *no* filtering — it just walks the operations and emits
+typed method stubs.
+
+Request/response types come from sibling model files already produced by
+`datamodel-codegen` (Python) and `openapi-typescript --root-types
+--root-types-no-schema-prefix` (TypeScript). We only import the names
+here; this script doesn't generate types itself.
+
+Output:
+    --py-out  sdk/python/src/dograh_sdk/_generated_client.py
+    --ts-out  sdk/typescript/src/_generated_client.ts
+"""
+
+from __future__ import annotations
+
+import argparse
+import json
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Any
+
+
+_API_PREFIX = "/api/v1"
+
+# openapi scalar → (python, typescript)
+_TYPE_MAP = {
+    "integer": ("int", "number"),
+    "number": ("float", "number"),
+    "string": ("str", "string"),
+    "boolean": ("bool", "boolean"),
+}
+
+
+def _map_scalar(schema: dict[str, Any]) -> tuple[str, str]:
+    t = schema.get("type")
+    if t in _TYPE_MAP:
+        return _TYPE_MAP[t]
+    # optional string often shown as anyOf:[{type:string}, {type:null}]
+    for branch in schema.get("anyOf") or []:
+        if branch.get("type") in _TYPE_MAP and branch.get("type") != "null":
+            return _TYPE_MAP[branch["type"]]
+    return ("Any", "unknown")
+
+
+def _ref_name(schema: dict[str, Any]) -> str | None:
+    ref = schema.get("$ref")
+    if isinstance(ref, str) and ref.startswith("#/components/schemas/"):
+        return ref.rsplit("/", 1)[-1]
+    return None
+
+
+@dataclass
+class ResponseType:
+    """What comes back from an operation. `class_name` is a model class from
+    `_generated_models`; `is_list` wraps it as a list."""
+    class_name: str | None = None
+    is_list: bool = False
+
+    @property
+    def py(self) -> str:
+        if self.class_name is None:
+            return "Any"
+        return f"list[{self.class_name}]" if self.is_list else self.class_name
+
+    @property
+    def ts(self) -> str:
+        if self.class_name is None:
+            return "unknown"
+        return f"{self.class_name}[]" if self.is_list else self.class_name
+
+
+@dataclass
+class Param:
+    name: str
+    py_type: str
+    ts_type: str
+    required: bool
+
+
+@dataclass
+class Operation:
+    method: str
+    verb: str
+    path: str
+    description: str
+    path_params: list[Param] = field(default_factory=list)
+    query_params: list[Param] = field(default_factory=list)
+    request_class: str | None = None        # None → no body
+    response: ResponseType = field(default_factory=ResponseType)
+
+
+def _collect(spec: dict[str, Any]) -> list[Operation]:
+    ops: list[Operation] = []
+    used_models: set[str] = set()
+
+    for path, methods in spec.get("paths", {}).items():
+        for verb, op in methods.items():
+            if not isinstance(op, dict) or "x-sdk-method" not in op:
+                continue
+
+            description = (op.get("x-sdk-description") or op.get("summary") or "").strip()
+            sdk_path = path[len(_API_PREFIX):] if path.startswith(_API_PREFIX) else path
+
+            path_params: list[Param] = []
+            query_params: list[Param] = []
+            for p in op.get("parameters") or []:
+                py_t, ts_t = _map_scalar(p.get("schema") or {})
+                param = Param(
+                    name=p["name"],
+                    py_type=py_t,
+                    ts_type=ts_t,
+                    required=bool(p.get("required")),
+                )
+                if p.get("in") == "path":
+                    path_params.append(param)
+                elif p.get("in") == "query":
+                    query_params.append(param)
+
+            request_class: str | None = None
+            rb = op.get("requestBody") or {}
+            rb_schema = (
+                (rb.get("content") or {}).get("application/json", {}).get("schema") or {}
+            )
+            if rb_schema:
+                request_class = _ref_name(rb_schema)
+
+            response = ResponseType()
+            r200 = (
+                op.get("responses", {})
+                .get("200", {})
+                .get("content", {})
+                .get("application/json", {})
+                .get("schema")
+                or {}
+            )
+            if r200:
+                name = _ref_name(r200)
+                if name:
+                    response = ResponseType(class_name=name)
+                elif r200.get("type") == "array":
+                    item = r200.get("items") or {}
+                    name = _ref_name(item)
+                    if name:
+                        response = ResponseType(class_name=name, is_list=True)
+
+            for cls in (request_class, response.class_name):
+                if cls:
+                    used_models.add(cls)
+
+            ops.append(Operation(
+                method=op["x-sdk-method"],
+                verb=verb.lower(),
+                path=sdk_path,
+                description=description,
+                path_params=path_params,
+                query_params=query_params,
+                request_class=request_class,
+                response=response,
+            ))
+
+    ops.sort(key=lambda o: o.method)
+    return ops, sorted(used_models)
+
+
+# ── Python emitter ─────────────────────────────────────────────────────
+
+
+def _py_method(op: Operation) -> str:
+    positional = [f"{p.name}: {p.py_type}" for p in op.path_params]
+    kw_only: list[str] = []
+    if op.request_class:
+        kw_only.append(f"body: {op.request_class}")
+    for p in op.query_params:
+        kw_only.append(f"{p.name}: {p.py_type} | None = None")
+
+    sig = ", ".join(["self", *positional] + (["*"] + kw_only if kw_only else []))
+
+    lines: list[str] = []
+    lines.append(f"    def {op.method}({sig}) -> {op.response.py}:")
+    lines.append(f'        """{op.description or op.verb.upper() + " " + op.path}"""')
+
+    path_expr = f'f"{op.path}"' if op.path_params else f'"{op.path}"'
+
+    call_kwargs: list[str] = []
+    if op.query_params:
+        lines.append("        params: dict[str, Any] = {}")
+        for p in op.query_params:
+            lines.append(f"        if {p.name} is not None:")
+            lines.append(f'            params["{p.name}"] = {p.name}')
+        call_kwargs.append("params=params")
+    if op.request_class:
+        call_kwargs.append('json=body.model_dump(mode="json", exclude_none=True)')
+
+    extra = (", " + ", ".join(call_kwargs)) if call_kwargs else ""
+    raw_call = f'self._request("{op.verb.upper()}", {path_expr}{extra})'
+
+    if op.response.class_name is None:
+        lines.append(f"        return {raw_call}")
+    elif op.response.is_list:
+        lines.append(f"        data = {raw_call}")
+        lines.append(f"        return [{op.response.class_name}.model_validate(x) for x in data]")
+    else:
+        lines.append(f"        data = {raw_call}")
+        lines.append(f"        return {op.response.class_name}.model_validate(data)")
+
+    lines.append("")
+    return "\n".join(lines)
+
+
+_PY_HEADER = '''\
+"""GENERATED — do not edit. Source: filtered OpenAPI from `api.app`.
+
+Regenerate with `./scripts/generate_sdk.sh`.
+
+`DograhClient` mixes in this class to get HTTP methods for every route
+decorated with `sdk_expose(...)` on the backend. Request/response types
+come from `_generated_models` (datamodel-codegen output).
+"""
+
+from __future__ import annotations
+
+from typing import Any
+
+from dograh_sdk._generated_models import (
+{imports}
+)
+
+
+class _GeneratedClient:
+    # `DograhClient.__init__` installs `self._request` (see client.py).
+
+'''
+
+
+def emit_python(ops: list[Operation], models: list[str]) -> str:
+    imports = "\n".join(f"    {m}," for m in models)
+    body = "\n".join(_py_method(op) for op in ops)
+    return _PY_HEADER.format(imports=imports) + body
+
+
+# ── TypeScript emitter ─────────────────────────────────────────────────
+
+
+def _snake_to_camel(s: str) -> str:
+    parts = s.split("_")
+    return parts[0] + "".join(p.title() for p in parts[1:])
+
+
+def _ts_method(op: Operation) -> str:
+    name = _snake_to_camel(op.method)
+    positional = [f"{_snake_to_camel(p.name)}: {p.ts_type}" for p in op.path_params]
+
+    opts_props: list[str] = []
+    if op.request_class:
+        opts_props.append(f"body: {op.request_class}")
+    for p in op.query_params:
+        opts_props.append(f"{_snake_to_camel(p.name)}?: {p.ts_type}")
+
+    args = list(positional)
+    if opts_props:
+        required_in_opts = op.request_class is not None
+        opts_sig = "{ " + "; ".join(opts_props) + " }"
+        # If body is required, opts is required too (no `= {}` default)
+        args.append(f"opts: {opts_sig}" if required_in_opts else f"opts: {opts_sig} = {{}}")
+
+    sig = ", ".join(args)
+    ret = op.response.ts
+
+    lines: list[str] = []
+    lines.append(f"    /** {op.description or op.verb.upper() + ' ' + op.path} */")
+    lines.append(f"    async {name}({sig}): Promise<{ret}> {{")
+
+    path_expr = op.path
+    for p in op.path_params:
+        path_expr = path_expr.replace("{" + p.name + "}", "${" + _snake_to_camel(p.name) + "}")
+    tmpl = f"`{path_expr}`" if op.path_params else f'"{op.path}"'
+
+    call_opts: list[str] = []
+    if op.query_params:
+        entries: list[str] = []
+        for p in op.query_params:
+            camel = _snake_to_camel(p.name)
+            entries.append(f'            ...(opts.{camel} !== undefined ? {{ "{p.name}": opts.{camel} }} : {{}}),')
+        lines.append("        const params: Record<string, unknown> = {")
+        lines.extend(entries)
+        lines.append("        };")
+        call_opts.append("params")
+    if op.request_class:
+        call_opts.append("json: opts.body")
+
+    extra = (", { " + ", ".join(call_opts) + " }") if call_opts else ""
+    generic = f"<{ret}>" if ret != "unknown" else ""
+    lines.append(f'        return this.request{generic}("{op.verb.upper()}", {tmpl}{extra});')
+    lines.append("    }")
+    lines.append("")
+    return "\n".join(lines)
+
+
+_TS_HEADER = """\
+// GENERATED — do not edit. Source: filtered OpenAPI from `api.app`.
+//
+// Regenerate with `./scripts/generate_sdk.sh`.
+//
+// `DograhClient` extends this base to get HTTP methods for every route
+// decorated with `sdk_expose(...)`. Request/response types come from
+// `_generated_models` (openapi-typescript output, --root-types).
+
+import type {{
+{imports}
+}} from "./_generated_models.js";
+
+export abstract class _GeneratedClient {{
+    protected abstract request<T = unknown>(
+        method: string,
+        path: string,
+        opts?: {{ json?: unknown; params?: Record<string, unknown> }},
+    ): Promise<T>;
+
+"""
+
+
+def emit_typescript(ops: list[Operation], models: list[str]) -> str:
+    imports = "\n".join(f"    {m}," for m in models)
+    body = "\n".join(_ts_method(op) for op in ops)
+    return _TS_HEADER.format(imports=imports) + body + "}\n"
+
+
+# ── CLI ────────────────────────────────────────────────────────────────
+
+
+def main() -> None:
+    ap = argparse.ArgumentParser(description=__doc__)
+    ap.add_argument("--input", required=True, help="Path to filtered openapi.json")
+    ap.add_argument("--py-out", required=True)
+    ap.add_argument("--ts-out", required=True)
+    args = ap.parse_args()
+
+    spec = json.loads(Path(args.input).read_text())
+    ops, models = _collect(spec)
+    if not ops:
+        raise SystemExit("No x-sdk-method operations — nothing to emit.")
+
+    Path(args.py_out).write_text(emit_python(ops, models))
+    Path(args.ts_out).write_text(emit_typescript(ops, models))
+    print(f"  → {len(ops)} operations, {len(models)} models referenced")
+    print(f"  → {args.py_out}")
+    print(f"  → {args.ts_out}")
+
+
+if __name__ == "__main__":
+    main()
--- a/sdk/python/.gitignore
+++ b/sdk/python/.gitignore
@ -0,0 +1,3 @@
+dist/
+build/
+*.egg-info/
--- a/sdk/python/LICENSE
+++ b/sdk/python/LICENSE
@ -0,0 +1,24 @@
+BSD 2-Clause License
+
+Copyright (c) 2025, Zansat Technologies Private Limited
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+1. Redistributions of source code must retain the above copyright notice, this
+   list of conditions and the following disclaimer.
+
+2. Redistributions in binary form must reproduce the above copyright notice,
+   this list of conditions and the following disclaimer in the documentation
+   and/or other materials provided with the distribution.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
+FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
--- a/sdk/python/README.md
+++ b/sdk/python/README.md
@ -0,0 +1,77 @@
+# dograh-sdk
+
+Typed builder for Dograh voice-AI workflows. Fetches the node-spec catalog from
+the Dograh backend at session start, validates every call against it at the
+call site, and produces `ReactFlowDTO`-compatible JSON.
+
+## Install
+
+```bash
+pip install dograh-sdk
+```
+
+For local development against a checked-out monorepo:
+
+```bash
+pip install -e sdk/python/
+```
+
+## Usage
+
+```python
+from dograh_sdk import DograhClient, Workflow
+
+with DograhClient(base_url="http://localhost:8000", api_key="...") as client:
+    wf = Workflow(client=client, name="loan_qualification")
+
+    start = wf.add(
+        type="startCall",
+        name="greeting",
+        prompt="You are Sarah from Acme Loans. Greet the caller warmly.",
+        greeting_type="text",
+        greeting="Hi {{first_name}}, this is Sarah.",
+    )
+    qualify = wf.add(
+        type="agentNode",
+        name="qualify",
+        prompt="Ask about loan amount and timeline.",
+    )
+    done = wf.add(type="endCall", name="done", prompt="Thank the caller.")
+
+    wf.edge(start, qualify, label="interested", condition="Caller expressed interest.")
+    wf.edge(qualify, done, label="done", condition="Qualification complete.")
+
+    client.save_workflow(workflow_id=123, workflow=wf)
+```
+
+## What gets validated at the call site
+
+The SDK fetches the spec for each node type via `get_node_type` and raises
+`ValidationError` immediately when:
+
+- an unknown field is passed (catches typos)
+- a required field is missing or empty
+- a scalar type is wrong (e.g., string for a boolean)
+- an `options` value isn't in the allowed list
+
+When a spec carries an `llm_hint`, the hint is appended to the error message so
+an LLM agent can self-correct on retry:
+
+```
+tool_uuids: expected tool_refs, got str
+  Hint: List of tool UUIDs from `list_tools`.
+```
+
+Server-side Pydantic validators run on save and surface anything the SDK lets
+through (compound invariants, cross-field rules).
+
+## Environment
+
+```bash
+DOGRAH_API_URL=http://localhost:8000   # default
+DOGRAH_API_KEY=sk-...                  # sent as X-API-Key
+```
+
+## License
+
+BSD 2-Clause — see `LICENSE`.
--- a/sdk/python/pyproject.toml
+++ b/sdk/python/pyproject.toml
@ -0,0 +1,49 @@
+[project]
+name = "dograh-sdk"
+version = "0.1.2"
+description = "Typed builder for Dograh voice-AI workflows"
+readme = "README.md"
+requires-python = ">=3.10"
+license = { text = "BSD-2-Clause" }
+authors = [
+    { name = "Zansat Technologies Private Limited", email = "contact@dograh.com" },
+]
+keywords = ["dograh", "voice-ai", "workflow", "sdk", "llm", "agent"]
+classifiers = [
+    "Development Status :: 3 - Alpha",
+    "Intended Audience :: Developers",
+    "License :: OSI Approved :: BSD License",
+    "Programming Language :: Python :: 3",
+    "Programming Language :: Python :: 3.10",
+    "Programming Language :: Python :: 3.11",
+    "Programming Language :: Python :: 3.12",
+    "Programming Language :: Python :: 3.13",
+    "Topic :: Software Development :: Libraries",
+]
+dependencies = [
+    "httpx>=0.27",
+    "pydantic>=2.0",
+]
+
+[project.optional-dependencies]
+dev = [
+    "pytest>=7.0",
+]
+
+[project.urls]
+Homepage = "https://dograh.com"
+Documentation = "https://docs.dograh.com"
+Repository = "https://github.com/dograh-hq/dograh"
+
+[project.scripts]
+dograh-sdk-codegen = "dograh_sdk.codegen:main"
+
+[build-system]
+requires = ["hatchling"]
+build-backend = "hatchling.build"
+
+[tool.hatch.build.targets.wheel]
+packages = ["src/dograh_sdk"]
+
+[tool.pytest.ini_options]
+testpaths = ["tests"]
--- a/sdk/python/src/dograh_sdk/init.py
+++ b/sdk/python/src/dograh_sdk/init.py
@ -0,0 +1,35 @@
+"""Dograh SDK — typed builder for voice-AI workflows.
+
+Runtime SDK: fetches the spec catalog from the Dograh backend at session
+start and validates every `Workflow.add()` call against it. LLMs don't
+need to import per-node-type classes — the `type` argument is a string
+keyed against the fetched spec catalog.
+
+    from dograh_sdk import DograhClient, Workflow
+
+    with DograhClient(base_url="http://localhost:8000", api_key=...) as client:
+        wf = Workflow(client=client, name="loan_qualification")
+        start = wf.add(type="startCall", name="greeting", prompt="...")
+        qualify = wf.add(type="agentNode", name="qualify", prompt="...")
+        wf.edge(start, qualify, label="interested", condition="...")
+        client.save_workflow(workflow_id=123, workflow=wf)
+
+For typed IDE autocomplete, generate per-node dataclasses via the SDK
+codegen (Phase 6) — the runtime and typed SDKs share this same core.
+"""
+
+from .client import DograhClient
+from .errors import ApiError, DograhSdkError, SpecMismatchError, ValidationError
+from .typed._base import TypedNode
+from .workflow import NodeRef, Workflow
+
+__all__ = [
+    "ApiError",
+    "DograhClient",
+    "DograhSdkError",
+    "NodeRef",
+    "SpecMismatchError",
+    "TypedNode",
+    "ValidationError",
+    "Workflow",
+]
--- a/sdk/python/src/dograh_sdk/_generated_client.py
+++ b/sdk/python/src/dograh_sdk/_generated_client.py
@ -0,0 +1,102 @@
+"""GENERATED — do not edit. Source: filtered OpenAPI from `api.app`.
+
+Regenerate with `./scripts/generate_sdk.sh`.
+
+`DograhClient` mixes in this class to get HTTP methods for every route
+decorated with `sdk_expose(...)` on the backend. Request/response types
+come from `_generated_models` (datamodel-codegen output).
+"""
+
+from __future__ import annotations
+
+from typing import Any
+
+from dograh_sdk._generated_models import (
+    CredentialResponse,
+    DocumentListResponseSchema,
+    InitiateCallRequest,
+    NodeSpec,
+    NodeTypesResponse,
+    RecordingListResponseSchema,
+    ToolResponse,
+    UpdateWorkflowRequest,
+    WorkflowListResponse,
+    WorkflowResponse,
+)
+
+
+class _GeneratedClient:
+    # `DograhClient.__init__` installs `self._request` (see client.py).
+
+    def get_node_type(self, name: str) -> NodeSpec:
+        """Fetch a single node spec by name."""
+        data = self._request("GET", f"/node-types/{name}")
+        return NodeSpec.model_validate(data)
+
+    def get_workflow(self, workflow_id: int) -> WorkflowResponse:
+        """Get a single workflow by ID (returns draft if one exists, else published)."""
+        data = self._request("GET", f"/workflow/fetch/{workflow_id}")
+        return WorkflowResponse.model_validate(data)
+
+    def list_credentials(self) -> list[CredentialResponse]:
+        """List webhook credentials available to the authenticated organization."""
+        data = self._request("GET", "/credentials/")
+        return [CredentialResponse.model_validate(x) for x in data]
+
+    def list_documents(self, *, status: str | None = None, limit: int | None = None, offset: int | None = None) -> DocumentListResponseSchema:
+        """List knowledge base documents available to the authenticated organization."""
+        params: dict[str, Any] = {}
+        if status is not None:
+            params["status"] = status
+        if limit is not None:
+            params["limit"] = limit
+        if offset is not None:
+            params["offset"] = offset
+        data = self._request("GET", "/knowledge-base/documents", params=params)
+        return DocumentListResponseSchema.model_validate(data)
+
+    def list_node_types(self) -> NodeTypesResponse:
+        """List every registered node type with its spec. Pinned to spec_version."""
+        data = self._request("GET", "/node-types")
+        return NodeTypesResponse.model_validate(data)
+
+    def list_recordings(self, *, workflow_id: int | None = None, tts_provider: str | None = None, tts_model: str | None = None, tts_voice_id: str | None = None) -> RecordingListResponseSchema:
+        """List workflow recordings available to the authenticated organization."""
+        params: dict[str, Any] = {}
+        if workflow_id is not None:
+            params["workflow_id"] = workflow_id
+        if tts_provider is not None:
+            params["tts_provider"] = tts_provider
+        if tts_model is not None:
+            params["tts_model"] = tts_model
+        if tts_voice_id is not None:
+            params["tts_voice_id"] = tts_voice_id
+        data = self._request("GET", "/workflow-recordings/", params=params)
+        return RecordingListResponseSchema.model_validate(data)
+
+    def list_tools(self, *, status: str | None = None, category: str | None = None) -> list[ToolResponse]:
+        """List tools available to the authenticated organization."""
+        params: dict[str, Any] = {}
+        if status is not None:
+            params["status"] = status
+        if category is not None:
+            params["category"] = category
+        data = self._request("GET", "/tools/", params=params)
+        return [ToolResponse.model_validate(x) for x in data]
+
+    def list_workflows(self, *, status: str | None = None) -> list[WorkflowListResponse]:
+        """List all workflows in the authenticated organization."""
+        params: dict[str, Any] = {}
+        if status is not None:
+            params["status"] = status
+        data = self._request("GET", "/workflow/fetch", params=params)
+        return [WorkflowListResponse.model_validate(x) for x in data]
+
+    def test_phone_call(self, *, body: InitiateCallRequest) -> Any:
+        """Place a test call from a workflow to a phone number."""
+        return self._request("POST", "/telephony/initiate-call", json=body.model_dump(mode="json", exclude_none=True))
+
+    def update_workflow(self, workflow_id: int, *, body: UpdateWorkflowRequest) -> WorkflowResponse:
+        """Update a workflow's name and/or definition. Saves as a new draft."""
+        data = self._request("PUT", f"/workflow/{workflow_id}", json=body.model_dump(mode="json", exclude_none=True))
+        return WorkflowResponse.model_validate(data)
--- a/sdk/python/src/dograh_sdk/_generated_models.py
+++ b/sdk/python/src/dograh_sdk/_generated_models.py
@ -0,0 +1,358 @@
+# generated by datamodel-codegen:
+#   filename:  dograh-openapi-XXXXXX.json.oPRfLAwVZP
+#   timestamp: 2026-04-21T02:15:12+00:00
+
+from __future__ import annotations
+
+from enum import Enum
+from typing import Annotated, Any
+
+from pydantic import AwareDatetime, BaseModel, ConfigDict, Field
+
+
+class CallDispositionCodes(BaseModel):
+    disposition_codes: Annotated[list[str] | None, Field(title='Disposition Codes')] = (
+        []
+    )
+
+
+class CreatedByResponse(BaseModel):
+    """
+    Response schema for the user who created a tool.
+    """
+
+    id: Annotated[int, Field(title='Id')]
+    provider_id: Annotated[str, Field(title='Provider Id')]
+
+
+class CredentialResponse(BaseModel):
+    """
+    Response schema for a webhook credential (never includes sensitive data).
+    """
+
+    uuid: Annotated[str, Field(title='Uuid')]
+    name: Annotated[str, Field(title='Name')]
+    description: Annotated[str | None, Field(title='Description')]
+    credential_type: Annotated[str, Field(title='Credential Type')]
+    created_at: Annotated[AwareDatetime, Field(title='Created At')]
+    updated_at: Annotated[AwareDatetime | None, Field(title='Updated At')]
+
+
+class DisplayOptions(BaseModel):
+    """
+    Conditional visibility rules.
+
+    `show` keys are AND-combined: this property is visible only when EVERY
+    referenced field's value matches one of the listed values.
+
+    `hide` keys are OR-combined: this property is hidden when ANY referenced
+    field's value matches one of the listed values.
+
+    Example:
+        DisplayOptions(show={"extraction_enabled": [True]})
+        DisplayOptions(show={"greeting_type": ["audio"]})
+    """
+
+    model_config = ConfigDict(
+        extra='forbid',
+    )
+    show: Annotated[dict[str, list[Any]] | None, Field(title='Show')] = None
+    hide: Annotated[dict[str, list[Any]] | None, Field(title='Hide')] = None
+
+
+class DocumentResponseSchema(BaseModel):
+    """
+    Response schema for document metadata.
+    """
+
+    id: Annotated[int, Field(title='Id')]
+    document_uuid: Annotated[str, Field(title='Document Uuid')]
+    filename: Annotated[str, Field(title='Filename')]
+    file_size_bytes: Annotated[int, Field(title='File Size Bytes')]
+    file_hash: Annotated[str, Field(title='File Hash')]
+    mime_type: Annotated[str, Field(title='Mime Type')]
+    processing_status: Annotated[str, Field(title='Processing Status')]
+    processing_error: Annotated[str | None, Field(title='Processing Error')] = None
+    total_chunks: Annotated[int, Field(title='Total Chunks')]
+    retrieval_mode: Annotated[str | None, Field(title='Retrieval Mode')] = 'chunked'
+    custom_metadata: Annotated[dict[str, Any], Field(title='Custom Metadata')]
+    docling_metadata: Annotated[dict[str, Any], Field(title='Docling Metadata')]
+    source_url: Annotated[str | None, Field(title='Source Url')] = None
+    created_at: Annotated[AwareDatetime, Field(title='Created At')]
+    updated_at: Annotated[AwareDatetime, Field(title='Updated At')]
+    organization_id: Annotated[int, Field(title='Organization Id')]
+    created_by: Annotated[int, Field(title='Created By')]
+    is_active: Annotated[bool, Field(title='Is Active')]
+
+
+class GraphConstraints(BaseModel):
+    """
+    Per-node-type graph rules. WorkflowGraph enforces these at validation.
+    """
+
+    model_config = ConfigDict(
+        extra='forbid',
+    )
+    min_incoming: Annotated[int | None, Field(title='Min Incoming')] = None
+    max_incoming: Annotated[int | None, Field(title='Max Incoming')] = None
+    min_outgoing: Annotated[int | None, Field(title='Min Outgoing')] = None
+    max_outgoing: Annotated[int | None, Field(title='Max Outgoing')] = None
+
+
+class InitiateCallRequest(BaseModel):
+    workflow_id: Annotated[int, Field(title='Workflow Id')]
+    workflow_run_id: Annotated[int | None, Field(title='Workflow Run Id')] = None
+    phone_number: Annotated[str | None, Field(title='Phone Number')] = None
+
+
+class NodeCategory(Enum):
+    """
+    Drives grouping in the AddNodePanel UI.
+    """
+
+    call_node = 'call_node'
+    global_node = 'global_node'
+    trigger = 'trigger'
+    integration = 'integration'
+
+
+class NodeExample(BaseModel):
+    """
+    A worked example LLMs can pattern-match. Keep small and realistic.
+    """
+
+    model_config = ConfigDict(
+        extra='forbid',
+    )
+    name: Annotated[str, Field(title='Name')]
+    description: Annotated[str | None, Field(title='Description')] = None
+    data: Annotated[dict[str, Any], Field(title='Data')]
+
+
+class PropertyOption(BaseModel):
+    """
+    An option in an `options` or `multi_options` dropdown.
+    """
+
+    model_config = ConfigDict(
+        extra='forbid',
+    )
+    value: Annotated[str | int | bool | float, Field(title='Value')]
+    label: Annotated[str, Field(title='Label')]
+    description: Annotated[str | None, Field(title='Description')] = None
+
+
+class PropertyType(Enum):
+    """
+    Bounded vocabulary of property types the renderer dispatches on.
+
+    Adding a value here requires a matching arm in the frontend
+    `<PropertyInput>` switch and (where relevant) the SDK codegen template.
+    """
+
+    string = 'string'
+    number = 'number'
+    boolean = 'boolean'
+    options = 'options'
+    multi_options = 'multi_options'
+    fixed_collection = 'fixed_collection'
+    json = 'json'
+    tool_refs = 'tool_refs'
+    document_refs = 'document_refs'
+    recording_ref = 'recording_ref'
+    credential_ref = 'credential_ref'
+    mention_textarea = 'mention_textarea'
+    url = 'url'
+
+
+class RecordingResponseSchema(BaseModel):
+    """
+    Response schema for a single recording.
+    """
+
+    id: Annotated[int, Field(title='Id')]
+    recording_id: Annotated[str, Field(title='Recording Id')]
+    workflow_id: Annotated[int | None, Field(title='Workflow Id')] = None
+    organization_id: Annotated[int, Field(title='Organization Id')]
+    tts_provider: Annotated[str | None, Field(title='Tts Provider')] = None
+    tts_model: Annotated[str | None, Field(title='Tts Model')] = None
+    tts_voice_id: Annotated[str | None, Field(title='Tts Voice Id')] = None
+    transcript: Annotated[str, Field(title='Transcript')]
+    storage_key: Annotated[str, Field(title='Storage Key')]
+    storage_backend: Annotated[str, Field(title='Storage Backend')]
+    metadata: Annotated[dict[str, Any], Field(title='Metadata')]
+    created_by: Annotated[int, Field(title='Created By')]
+    created_at: Annotated[AwareDatetime, Field(title='Created At')]
+    is_active: Annotated[bool, Field(title='Is Active')]
+
+
+class ToolResponse(BaseModel):
+    """
+    Response schema for a tool.
+    """
+
+    id: Annotated[int, Field(title='Id')]
+    tool_uuid: Annotated[str, Field(title='Tool Uuid')]
+    name: Annotated[str, Field(title='Name')]
+    description: Annotated[str | None, Field(title='Description')]
+    category: Annotated[str, Field(title='Category')]
+    icon: Annotated[str | None, Field(title='Icon')]
+    icon_color: Annotated[str | None, Field(title='Icon Color')]
+    status: Annotated[str, Field(title='Status')]
+    definition: Annotated[dict[str, Any], Field(title='Definition')]
+    created_at: Annotated[AwareDatetime, Field(title='Created At')]
+    updated_at: Annotated[AwareDatetime | None, Field(title='Updated At')]
+    created_by: CreatedByResponse | None = None
+
+
+class UpdateWorkflowRequest(BaseModel):
+    name: Annotated[str | None, Field(title='Name')] = None
+    workflow_definition: Annotated[
+        dict[str, Any] | None, Field(title='Workflow Definition')
+    ] = None
+    template_context_variables: Annotated[
+        dict[str, Any] | None, Field(title='Template Context Variables')
+    ] = None
+    workflow_configurations: Annotated[
+        dict[str, Any] | None, Field(title='Workflow Configurations')
+    ] = None
+
+
+class ValidationError(BaseModel):
+    loc: Annotated[list[str | int], Field(title='Location')]
+    msg: Annotated[str, Field(title='Message')]
+    type: Annotated[str, Field(title='Error Type')]
+    input: Annotated[Any | None, Field(title='Input')] = None
+    ctx: Annotated[dict[str, Any] | None, Field(title='Context')] = None
+
+
+class WorkflowListResponse(BaseModel):
+    """
+    Lightweight response for workflow listings (excludes large fields).
+    """
+
+    id: Annotated[int, Field(title='Id')]
+    name: Annotated[str, Field(title='Name')]
+    status: Annotated[str, Field(title='Status')]
+    created_at: Annotated[AwareDatetime, Field(title='Created At')]
+    total_runs: Annotated[int, Field(title='Total Runs')]
+
+
+class WorkflowResponse(BaseModel):
+    id: Annotated[int, Field(title='Id')]
+    name: Annotated[str, Field(title='Name')]
+    status: Annotated[str, Field(title='Status')]
+    created_at: Annotated[AwareDatetime, Field(title='Created At')]
+    workflow_definition: Annotated[dict[str, Any], Field(title='Workflow Definition')]
+    current_definition_id: Annotated[int | None, Field(title='Current Definition Id')]
+    template_context_variables: Annotated[
+        dict[str, Any] | None, Field(title='Template Context Variables')
+    ] = None
+    call_disposition_codes: CallDispositionCodes | None = None
+    total_runs: Annotated[int | None, Field(title='Total Runs')] = None
+    workflow_configurations: Annotated[
+        dict[str, Any] | None, Field(title='Workflow Configurations')
+    ] = None
+    version_number: Annotated[int | None, Field(title='Version Number')] = None
+    version_status: Annotated[str | None, Field(title='Version Status')] = None
+
+
+class DocumentListResponseSchema(BaseModel):
+    """
+    Response schema for list of documents.
+    """
+
+    documents: Annotated[list[DocumentResponseSchema], Field(title='Documents')]
+    total: Annotated[int, Field(title='Total')]
+    limit: Annotated[int, Field(title='Limit')]
+    offset: Annotated[int, Field(title='Offset')]
+
+
+class HTTPValidationError(BaseModel):
+    detail: Annotated[list[ValidationError] | None, Field(title='Detail')] = None
+
+
+class PropertySpec(BaseModel):
+    """
+    Single field on a node.
+
+    `description` is HUMAN-FACING — shown under the field in the edit
+    dialog. Keep it concise and explain what the field does.
+
+    `llm_hint` is LLM-FACING — appears only in the `get_node_type` MCP
+    response and in SDK schema output. Use it for catalog tool references
+    (e.g., "Use `list_recordings`"), array shape, expected value idioms,
+    or anything that would be noise in the UI. Optional; omit when the
+    `description` already suffices for both audiences.
+    """
+
+    model_config = ConfigDict(
+        extra='forbid',
+    )
+    name: Annotated[str, Field(title='Name')]
+    type: PropertyType
+    display_name: Annotated[str, Field(title='Display Name')]
+    description: Annotated[str, Field(min_length=1, title='Description')]
+    """
+    Human-facing explanation shown in the UI.
+    """
+    llm_hint: Annotated[str | None, Field(title='Llm Hint')] = None
+    """
+    LLM-only guidance; omitted from the UI.
+    """
+    default: Annotated[Any | None, Field(title='Default')] = None
+    required: Annotated[bool | None, Field(title='Required')] = False
+    placeholder: Annotated[str | None, Field(title='Placeholder')] = None
+    display_options: DisplayOptions | None = None
+    options: Annotated[list[PropertyOption] | None, Field(title='Options')] = None
+    properties: Annotated[list[PropertySpec] | None, Field(title='Properties')] = None
+    min_value: Annotated[float | None, Field(title='Min Value')] = None
+    max_value: Annotated[float | None, Field(title='Max Value')] = None
+    min_length: Annotated[int | None, Field(title='Min Length')] = None
+    max_length: Annotated[int | None, Field(title='Max Length')] = None
+    pattern: Annotated[str | None, Field(title='Pattern')] = None
+    editor: Annotated[str | None, Field(title='Editor')] = None
+    extra: Annotated[dict[str, Any] | None, Field(title='Extra')] = None
+
+
+class RecordingListResponseSchema(BaseModel):
+    """
+    Response schema for list of recordings.
+    """
+
+    recordings: Annotated[list[RecordingResponseSchema], Field(title='Recordings')]
+    total: Annotated[int, Field(title='Total')]
+
+
+class NodeSpec(BaseModel):
+    """
+    Single source of truth for a node type.
+    """
+
+    model_config = ConfigDict(
+        extra='forbid',
+    )
+    name: Annotated[str, Field(title='Name')]
+    display_name: Annotated[str, Field(title='Display Name')]
+    description: Annotated[str, Field(min_length=1, title='Description')]
+    """
+    Human-facing explanation shown in AddNodePanel.
+    """
+    llm_hint: Annotated[str | None, Field(title='Llm Hint')] = None
+    """
+    LLM-only guidance; omitted from the UI.
+    """
+    category: NodeCategory
+    icon: Annotated[str, Field(title='Icon')]
+    version: Annotated[str | None, Field(title='Version')] = '1.0.0'
+    properties: Annotated[list[PropertySpec], Field(title='Properties')]
+    examples: Annotated[list[NodeExample] | None, Field(title='Examples')] = None
+    graph_constraints: GraphConstraints | None = None
+
+
+class NodeTypesResponse(BaseModel):
+    spec_version: Annotated[str, Field(title='Spec Version')]
+    node_types: Annotated[list[NodeSpec], Field(title='Node Types')]
+
+
+PropertySpec.model_rebuild()
--- a/sdk/python/src/dograh_sdk/_validation.py
+++ b/sdk/python/src/dograh_sdk/_validation.py
@ -0,0 +1,166 @@
+"""Client-side validation of node data against a fetched spec.
+
+Intentionally lightweight: we catch the hallucinations that matter (typo'd
+field names, missing required fields, obvious scalar-type mismatches) and
+leave rigorous coercion to the backend's Pydantic validators, which run at
+save time. The tradeoff: the SDK fails fast on mistakes an LLM makes, and
+the backend remains the single authority on wire-format correctness.
+"""
+
+from __future__ import annotations
+
+from typing import Any
+
+from .errors import ValidationError
+
+# Map PropertyType → primitive Python type(s) we check at call site.
+# `None` means "skip scalar-type check" (compound types, refs, JSON, etc.).
+_SCALAR_TYPES: dict[str, tuple[type, ...] | None] = {
+    "string": (str,),
+    "number": (int, float),
+    "boolean": (bool,),
+    "options": None,  # value-in-options handled separately
+    "multi_options": None,
+    "fixed_collection": (list,),
+    "json": None,  # any JSON-serializable
+    "tool_refs": (list,),
+    "document_refs": (list,),
+    "recording_ref": (str,),
+    "credential_ref": (str,),
+    "mention_textarea": (str,),
+    "url": (str,),
+}
+
+
+def _with_hint(prop: dict[str, Any], message: str) -> str:
+    """Append `prop.llm_hint` to an error message when set.
+
+    Surfacing the hint inside validation errors lets an LLM author
+    self-correct on retry — it sees the catalog reference or value-shape
+    guidance inline with the failure.
+    """
+    hint = prop.get("llm_hint")
+    if hint:
+        return f"{message}\n  Hint: {hint}"
+    return message
+
+
+def _check_scalar(prop: dict[str, Any], value: Any) -> None:
+    # None is always allowed (missing value handled by required check).
+    if value is None:
+        return
+    allowed = _SCALAR_TYPES.get(prop["type"])
+    if allowed is None:
+        return
+    # Booleans ARE ints in Python, so exclude accidentally-matching bools.
+    if bool in allowed and not (int in allowed or float in allowed):
+        if not isinstance(value, bool):
+            raise ValidationError(
+                _with_hint(
+                    prop,
+                    f"{prop['name']}: expected boolean, got {type(value).__name__}",
+                )
+            )
+        return
+    if not isinstance(value, allowed):
+        raise ValidationError(
+            _with_hint(
+                prop,
+                f"{prop['name']}: expected {prop['type']}, "
+                f"got {type(value).__name__}",
+            )
+        )
+
+
+def _check_options(prop: dict[str, Any], value: Any) -> None:
+    if value is None:
+        return
+    allowed = {o["value"] for o in prop.get("options") or []}
+    if not allowed:
+        return
+    if prop["type"] == "multi_options":
+        if not isinstance(value, list):
+            raise ValidationError(
+                _with_hint(
+                    prop,
+                    f"{prop['name']}: expected list, got {type(value).__name__}",
+                )
+            )
+        bad = [v for v in value if v not in allowed]
+        if bad:
+            raise ValidationError(
+                _with_hint(
+                    prop,
+                    f"{prop['name']}: values {bad} not in allowed {sorted(allowed)}",
+                )
+            )
+    else:  # 'options'
+        if value not in allowed:
+            raise ValidationError(
+                _with_hint(
+                    prop,
+                    f"{prop['name']}: {value!r} not in allowed {sorted(allowed)}",
+                )
+            )
+
+
+def validate_node_data(
+    spec: dict[str, Any],
+    kwargs: dict[str, Any],
+) -> dict[str, Any]:
+    """Validate LLM-supplied kwargs against the node spec. Returns the data
+    dict to embed in the wire format, with defaults applied.
+
+    Raises:
+        ValidationError if kwargs contain unknown fields, omit required
+        fields, or carry obvious type mismatches.
+    """
+    declared = {p["name"]: p for p in spec["properties"]}
+
+    # Unknown field names — the most common LLM hallucination.
+    unknown = set(kwargs) - set(declared)
+    if unknown:
+        raise ValidationError(
+            f"{spec['name']}: unknown field(s) {sorted(unknown)}. "
+            f"Allowed: {sorted(declared)}"
+        )
+
+    # Per-property validation
+    data: dict[str, Any] = {}
+    for name, prop in declared.items():
+        if name in kwargs:
+            value = kwargs[name]
+        elif prop.get("default") is not None:
+            value = prop["default"]
+        else:
+            value = None
+
+        # Scalar / collection shape
+        if prop["type"] in ("options", "multi_options"):
+            _check_options(prop, value)
+        else:
+            _check_scalar(prop, value)
+
+        # Nested fixed_collection rows — validate each row as a sub-spec.
+        if prop["type"] == "fixed_collection" and isinstance(value, list):
+            sub_spec = {"name": f"{spec['name']}.{name}", "properties": prop.get("properties") or []}
+            data[name] = [validate_node_data(sub_spec, row) for row in value]
+            continue
+
+        if value is not None:
+            data[name] = value
+
+    # Required check — must be set AND non-empty for strings.
+    for name, prop in declared.items():
+        if not prop.get("required"):
+            continue
+        val = data.get(name)
+        if val is None or (isinstance(val, str) and val.strip() == ""):
+            raise ValidationError(
+                _with_hint(
+                    prop,
+                    f"{spec['name']}: required field missing: {name}",
+                )
+            )
+
+    return data
--- a/sdk/python/src/dograh_sdk/client.py
+++ b/sdk/python/src/dograh_sdk/client.py
@ -0,0 +1,151 @@
+"""HTTP client for the Dograh REST API.
+
+Most endpoint methods come from `_GeneratedClient` (auto-generated from
+the FastAPI OpenAPI spec — see `scripts/generate_sdk.sh`). This class
+adds the session/auth/cache surface around that mixin plus a couple of
+ergonomic wrappers (`load_workflow`, `save_workflow`) that compose a
+generated call with local `Workflow` hydration.
+
+The SDK surface on the backend is controlled by decorating routes with
+`@sdk_expose(method="...")`; anything else is invisible here.
+"""
+
+from __future__ import annotations
+
+import os
+from typing import Any
+
+import httpx
+
+from ._generated_client import _GeneratedClient
+from ._generated_models import (
+    NodeSpec,
+    NodeTypesResponse,
+    UpdateWorkflowRequest,
+    WorkflowResponse,
+)
+from .errors import ApiError, SpecMismatchError
+from .workflow import Workflow
+
+
+class DograhClient(_GeneratedClient):
+    """Sync HTTP client. Suitable for scripts, pytest, and the LLM SDK
+    exec sandbox.
+
+    Auth precedence:
+        1. `api_key` kwarg
+        2. `DOGRAH_API_KEY` env var
+        3. unauthenticated (most endpoints will 401)
+    """
+
+    def __init__(
+        self,
+        *,
+        base_url: str | None = None,
+        api_key: str | None = None,
+        timeout: float = 30.0,
+    ):
+        resolved_url = base_url or os.environ.get(
+            "DOGRAH_API_URL", "http://localhost:8000"
+        )
+        self.base_url = resolved_url.rstrip("/")
+        self.api_key = api_key or os.environ.get("DOGRAH_API_KEY")
+
+        headers = {"Accept": "application/json"}
+        if self.api_key:
+            headers["X-API-Key"] = self.api_key
+
+        self._http = httpx.Client(
+            base_url=f"{self.base_url}/api/v1",
+            headers=headers,
+            timeout=timeout,
+        )
+
+        # Populated by the first call to `list_node_types` / `get_node_type`
+        # — avoids repeated round-trips when building a workflow.
+        self._spec_cache: dict[str, NodeSpec] = {}
+        self._spec_version: str | None = None
+
+    def close(self) -> None:
+        self._http.close()
+
+    def __enter__(self) -> DograhClient:
+        return self
+
+    def __exit__(self, *args: Any) -> None:
+        self.close()
+
+    @property
+    def spec_version(self) -> str | None:
+        """Contract version reported by the server, or None until the
+        first `list_node_types` / `get_node_type` call."""
+        return self._spec_version
+
+    # ── spec discovery overrides (generated methods + caching) ────────
+
+    def list_node_types(self) -> NodeTypesResponse:
+        resp = super().list_node_types()
+        self._spec_version = resp.spec_version
+        for spec in resp.node_types:
+            self._spec_cache[spec.name] = spec
+        return resp
+
+    def get_node_type(self, name: str) -> NodeSpec:
+        cached = self._spec_cache.get(name)
+        if cached is not None:
+            return cached
+        try:
+            spec = super().get_node_type(name)
+        except ApiError as e:
+            if e.status_code == 404:
+                raise SpecMismatchError(f"Unknown node type: {name!r}") from e
+            raise
+        self._spec_cache[name] = spec
+        return spec
+
+    # ── ergonomic workflow wrappers ───────────────────────────────────
+
+    def load_workflow(self, workflow_id: int) -> Workflow:
+        """Fetch a workflow and hydrate it into an editable `Workflow` builder."""
+        resp = self.get_workflow(workflow_id)
+        if not resp.workflow_definition:
+            raise ApiError(
+                200,
+                f"Workflow {workflow_id} has no definition to load",
+                body=resp.model_dump(mode="json"),
+            )
+        return Workflow.from_json(
+            resp.workflow_definition, client=self, name=resp.name
+        )
+
+    def save_workflow(self, workflow_id: int, workflow: Workflow) -> WorkflowResponse:
+        """Persist a `Workflow` builder back to the server as a new draft."""
+        return self.update_workflow(
+            workflow_id,
+            body=UpdateWorkflowRequest(
+                name=workflow.name,
+                workflow_definition=workflow.to_json(),
+            ),
+        )
+
+    # ── low-level ──────────────────────────────────────────────────
+
+    def _request(self, method: str, path: str, **kwargs: Any) -> Any:
+        resp = self._http.request(method, path, **kwargs)
+        if resp.status_code >= 400:
+            try:
+                body = resp.json()
+                if isinstance(body, dict):
+                    message = body.get("detail") or body.get("message") or resp.text
+                else:
+                    message = resp.text
+            except ValueError:
+                body = resp.text
+                message = resp.text
+            raise ApiError(resp.status_code, message, body=body)
+        if resp.status_code == 204 or not resp.content:
+            return None
+        try:
+            return resp.json()
+        except ValueError:
+            return resp.text
--- a/Show more
+++ b/Show more