added buffer_lock to prevent race condition in high concurrency scenarios
added documentation
This commit is contained in:
Alpha Nerd 2026-01-05 17:16:31 +01:00
parent 434b6d4cca
commit 20a016269d
9 changed files with 2167 additions and 42 deletions

View file

@ -0,0 +1,37 @@
# Sample NOMYO Router Configuration
#
# Top-level keys in this file:
#   endpoints                   - list of backend base URLs
#   max_concurrent_connections  - integer connection limit
#   api_keys                    - mapping of endpoint URL -> API key
#
# Only ONE `endpoints:` block may be active at a time. To use one of the
# commented alternatives below, comment out the active block first;
# duplicate top-level keys are invalid YAML and most parsers silently keep
# only the last one.

# Basic single endpoint configuration
endpoints:
  - http://localhost:11434

max_concurrent_connections: 2

# Multi-endpoint configuration with local Ollama instances
# endpoints:
#   - http://ollama-worker1:11434
#   - http://ollama-worker2:11434
#   - http://ollama-worker3:11434

# Mixed configuration with Ollama and OpenAI endpoints
# endpoints:
#   - http://localhost:11434
#   - https://api.openai.com/v1

# API keys for remote endpoints
# Use ${VAR_NAME} syntax to reference environment variables
# Entries must be indented under `api_keys`; an entry at column 0 would be
# parsed as a separate top-level key and `api_keys` itself would be null.
# NOTE(review): keys presumably have to match the URLs listed under
# `endpoints` exactly - confirm against the router's config loader.
api_keys:
  # Local Ollama instances typically don't require authentication
  "http://localhost:11434": "ollama"

  # Remote Ollama instances
  # "http://remote-ollama:11434": "ollama"

  # OpenAI API
  # "https://api.openai.com/v1": "${OPENAI_KEY}"

  # Anthropic API
  # "https://api.anthropic.com/v1": "${ANTHROPIC_KEY}"

  # Other OpenAI-compatible endpoints
  # "https://api.mistral.ai/v1": "${MISTRAL_KEY}"