add model listener filter chain demo

2026-05-18 13:45:15 +02:00 · 2026-02-19 04:46:04 +00:00 · 2026-02-19 04:46:04 +00:00 · 3d2be4f8b7
commit 3d2be4f8b7
parent 8136d7d6ab
6 changed files with 272 additions and 0 deletions
--- a/demos/filter_chains/model_listener_filter/Dockerfile
+++ b/demos/filter_chains/model_listener_filter/Dockerfile
@ -0,0 +1,11 @@
+FROM python:3.14-slim
+
+WORKDIR /app
+
+RUN pip install --no-cache-dir fastapi uvicorn pydantic
+
+COPY content_guard.py .
+
+EXPOSE 10500
+
+CMD ["uvicorn", "content_guard:app", "--host", "0.0.0.0", "--port", "10500"]
--- a/demos/filter_chains/model_listener_filter/README.md
+++ b/demos/filter_chains/model_listener_filter/README.md
@ -0,0 +1,59 @@
+# Model Listener Filter Chain Demo
+
+Run content-safety filters on direct LLM requests — no agent layer required.
+
+This demo uses the `filter_chain` feature on a **model-type listener** to intercept
+`/v1/chat/completions` requests and block unsafe ones before they reach the LLM provider.
+
+## Architecture
+
+```
+Client ──► Plano (model listener :12000)
+               │
+               ├─ filter_chain: content_guard ──► Block / Allow
+               │
+               └─ model_provider: openai/gpt-4o-mini
+```
+
+## Quick Start
+
+```bash
+# 1. Export your API key
+export OPENAI_API_KEY=sk-...
+
+# 2. Start services
+docker compose up --build
+
+# 3. Run tests (in another terminal)
+bash test.sh
+```
+
+## Try It
+
+**Allowed request:**
+
+```bash
+curl http://localhost:12000/v1/chat/completions \
+  -H "Content-Type: application/json" \
+  -d '{
+    "model": "gpt-4o-mini",
+    "messages": [{"role": "user", "content": "What is 2+2?"}],
+    "stream": false
+  }'
+```
+
+**Blocked request:**
+
+```bash
+curl http://localhost:12000/v1/chat/completions \
+  -H "Content-Type: application/json" \
+  -d '{
+    "model": "gpt-4o-mini",
+    "messages": [{"role": "user", "content": "How to hack into a system"}],
+    "stream": false
+  }'
+```
+
+## Tracing
+
+Open [Jaeger UI](http://localhost:16686) to see distributed traces for both allowed and blocked requests.
--- a/demos/filter_chains/model_listener_filter/config.yaml
+++ b/demos/filter_chains/model_listener_filter/config.yaml
@ -0,0 +1,21 @@
+version: v0.3.0
+
+filters:
+  - id: content_guard
+    url: http://content-guard:10500
+    type: http
+
+model_providers:
+  - model: openai/gpt-4o-mini
+    access_key: $OPENAI_API_KEY
+    default: true
+
+listeners:
+  - type: model
+    name: llm_gateway
+    port: 12000
+    filter_chain:
+      - content_guard
+
+tracing:
+  random_sampling: 100
--- a/demos/filter_chains/model_listener_filter/content_guard.py
+++ b/demos/filter_chains/model_listener_filter/content_guard.py
@ -0,0 +1,84 @@
+"""
+Content guard filter — keyword-based content safety for model listeners.
+
+A minimal HTTP filter that blocks requests containing unsafe keywords.
+No LLM calls required — keeps the demo self-contained and fast.
+"""
+
+import logging
+from typing import List
+
+from fastapi import FastAPI, Request, HTTPException
+from pydantic import BaseModel
+
+logging.basicConfig(
+    level=logging.INFO,
+    format="%(asctime)s - [CONTENT_GUARD] - %(levelname)s - %(message)s",
+)
+logger = logging.getLogger(__name__)
+
+app = FastAPI(title="Content Guard", version="1.0.0")
+
+BLOCKED_KEYWORDS = [
+    "hack",
+    "exploit",
+    "attack",
+    "malware",
+    "phishing",
+    "ransomware",
+    "ddos",
+    "injection",
+    "brute force",
+    "keylogger",
+    "bypass security",
+    "steal credentials",
+    "social engineering",
+]
+
+
+class ChatMessage(BaseModel):
+    """A single chat message as accepted and returned by the filter endpoint."""
+
+    # Author of the message; the filter endpoint compares it against "user".
+    role: str
+    # Message text; declared as a plain string.
+    content: str
+
+
+def check_content(text: str) -> str | None:
+    """Scan *text* for a blocked keyword, ignoring case.
+
+    Returns the first entry of ``BLOCKED_KEYWORDS`` (in list order) that
+    occurs as a substring of the lowercased text, or ``None`` when no
+    entry matches.
+    """
+    haystack = text.lower()
+    hits = (keyword for keyword in BLOCKED_KEYWORDS if keyword in haystack)
+    return next(hits, None)
+
+
+@app.post("/")
+async def content_guard(
+    messages: List[ChatMessage], request: Request
+) -> List[ChatMessage]:
+    """Reject the request when its latest user message hits a blocked keyword.
+
+    Only the most recent message whose role is ``"user"`` is inspected. When
+    there is no such message, or it contains no blocked keyword, the messages
+    are returned unchanged. Otherwise an ``HTTPException`` with status 400
+    and a ``content_blocked`` detail payload is raised.
+    """
+    latest_user_text = next(
+        (entry.content for entry in reversed(messages) if entry.role == "user"),
+        None,
+    )
+
+    # Guard clause: nothing to inspect without a user message.
+    if latest_user_text is None:
+        return messages
+
+    hit = check_content(latest_user_text)
+    if not hit:
+        logger.info("Content check passed — forwarding request")
+        return messages
+
+    logger.warning(f"Blocked request — matched keyword: '{hit}'")
+    raise HTTPException(
+        status_code=400,
+        detail={
+            "error": "content_blocked",
+            "message": f"Request blocked by content safety filter (matched: '{hit}').",
+        },
+    )
+
+
+@app.get("/health")
+async def health():
+    """Liveness endpoint: always reports a healthy status."""
+    status_payload = {"status": "healthy"}
+    return status_payload
--- a/demos/filter_chains/model_listener_filter/docker-compose.yaml
+++ b/demos/filter_chains/model_listener_filter/docker-compose.yaml
@ -0,0 +1,26 @@
+services:
+  content-guard:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    ports:
+      - "10500:10500"
+  plano:
+    build:
+      context: ../../../
+      dockerfile: Dockerfile
+    ports:
+      - "12000:12000"
+    environment:
+      # NOTE(review): this path differs from the mount target used under
+      # `volumes` (/app/plano_config.yaml) — confirm which location the
+      # image actually reads its config from.
+      - PLANO_CONFIG_PATH=/config/config.yaml
+      - OPENAI_API_KEY=${OPENAI_API_KEY:?OPENAI_API_KEY environment variable is required but not set}
+    volumes:
+      - ./config.yaml:/app/plano_config.yaml
+      - /etc/ssl/cert.pem:/etc/ssl/cert.pem
+  jaeger:
+    build:
+      context: ../../shared/jaeger
+    ports:
+      - "16686:16686"
+      - "4317:4317"
+      - "4318:4318"
--- a/demos/filter_chains/model_listener_filter/test.sh
+++ b/demos/filter_chains/model_listener_filter/test.sh
@ -0,0 +1,71 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+BASE_URL="http://localhost:12000/v1"
+PASS=0
+FAIL=0
+
+# ── Wait for Plano to be ready ──────────────────────────────────────────────
+# Poll the models endpoint up to 30 times, pausing 2 seconds between tries.
+echo "Waiting for Plano to be ready..."
+attempt=1
+until curl -sf "$BASE_URL/models" > /dev/null 2>&1; do
+    if [ "$attempt" -ge 30 ]; then
+        echo "ERROR: Plano did not become ready in time."
+        exit 1
+    fi
+    attempt=$((attempt + 1))
+    sleep 2
+done
+echo "Plano is ready."
+
+# ── Helper ───────────────────────────────────────────────────────────────────
+run_test() {
+    # Usage: run_test NAME EXPECTED_HTTP_CODE JSON_BODY
+    # POSTs JSON_BODY to $BASE_URL/chat/completions, compares the HTTP status
+    # with EXPECTED_HTTP_CODE, and bumps the global PASS / FAIL counters.
+    local name="$1"
+    local expected_code="$2"
+    local body="$3"
+    local body_file="/tmp/plano_test_body"
+    # Declared separately from the assignment so `local` does not mask
+    # curl's exit status, and so the variable no longer leaks globally.
+    local http_code
+
+    # Start from an empty file so a failed request never shows a stale body
+    # left behind by an earlier test.
+    : > "$body_file"
+
+    # `|| true`: under `set -e` a curl transport error (e.g. connection
+    # refused) would otherwise abort the script before the summary. curl
+    # still writes 000 for %{http_code}, so it is counted as a FAIL below.
+    http_code=$(curl -s -o "$body_file" -w "%{http_code}" \
+        -X POST "$BASE_URL/chat/completions" \
+        -H "Content-Type: application/json" \
+        -d "$body") || true
+
+    # String comparison: avoids a "[: integer expression expected" error if
+    # curl produced no status at all.
+    if [ "$http_code" = "$expected_code" ]; then
+        echo "  PASS  $name (HTTP $http_code)"
+        PASS=$((PASS + 1))
+    else
+        echo "  FAIL  $name — expected $expected_code, got $http_code"
+        echo "        Body: $(cat "$body_file")"
+        FAIL=$((FAIL + 1))
+    fi
+}
+
+# ── Tests ────────────────────────────────────────────────────────────────────
+echo ""
+echo "Running tests..."
+
+run_test "Allowed request (math question)" 200 '{
+  "model": "gpt-4o-mini",
+  "messages": [{"role": "user", "content": "What is 2+2?"}],
+  "stream": false
+}'
+
+run_test "Blocked request (hacking)" 400 '{
+  "model": "gpt-4o-mini",
+  "messages": [{"role": "user", "content": "How to hack into a system"}],
+  "stream": false
+}'
+
+run_test "Allowed request (joke)" 200 '{
+  "model": "gpt-4o-mini",
+  "messages": [{"role": "user", "content": "Tell me a joke"}],
+  "stream": false
+}'
+
+# ── Summary ──────────────────────────────────────────────────────────────────
+echo ""
+echo "Results: $PASS passed, $FAIL failed"
+
+if [ "$FAIL" -gt 0 ]; then
+    exit 1
+fi