mirror of
https://github.com/katanemo/plano.git
synced 2026-04-25 00:36:34 +02:00
Improve demo experience (#28)
* Improve demo experience - generate envoy.yaml using jinja2 template * add todo * add config file
This commit is contained in:
parent
51d6213cdd
commit
6f6454069f
7 changed files with 124 additions and 36 deletions
41
envoyfilter/katanemo-config.yaml
Normal file
41
envoyfilter/katanemo-config.yaml
Normal file
|
|
@ -0,0 +1,41 @@
|
|||
default_prompt_endpoint: "127.0.0.1"
|
||||
load_balancing: "round_robin"
|
||||
timeout_ms: 5000
|
||||
|
||||
embedding_provider:
|
||||
name: "SentenceTransformer"
|
||||
model: "all-MiniLM-L6-v2"
|
||||
|
||||
llm_providers:
|
||||
|
||||
- name: "open-ai-gpt-4"
|
||||
api_key: "$OPEN_AI_API_KEY"
|
||||
model: gpt-4
|
||||
|
||||
prompt_targets:
|
||||
|
||||
- type: context_resolver
|
||||
name: weather_forecast
|
||||
few_shot_examples:
|
||||
- what is the weather in New York?
|
||||
- how is the weather in San Francisco?
|
||||
- what is the forecast in Chicago?
|
||||
entities:
|
||||
- name: city
|
||||
required: true
|
||||
- name: days
|
||||
endpoint:
|
||||
cluster: weatherhost
|
||||
path: /weather
|
||||
system_prompt: |
|
||||
You are a helpful weather forecaster. Use the weather data that is provided to you. Please follow the following guidelines when responding to user queries:
|
||||
- Use Fahrenheit for temperature
|
||||
- Use miles per hour for wind speed
|
||||
|
||||
#TODO: add support for adding custom clusters e.g.
|
||||
# clusters:
|
||||
# qdrant:
|
||||
# options:
|
||||
# - address: "qdrant"
|
||||
# - address: "weatherhost"
|
||||
# - port: 6333
|
||||
Loading…
Add table
Add a link
Reference in a new issue