Merge pull request #1172 from seehi/feat-rag-embedding

Make RAG embedding configurable and add gpt-4-turbo in token_counter.
2026-06-20 15:38:09 +02:00 · 2024-04-10 15:59:31 +08:00 · 2024-04-10 15:59:31 +08:00 · 63ca5452bc
commit 63ca5452bc
parent 471d5be80c caa1300163
12 changed files with 268 additions and 37 deletions
--- a/config/config2.example.yaml
+++ b/config/config2.example.yaml
@@ -13,6 +13,16 @@ llm:
  # - gpt-4 8k: "gpt-4"
  # See for more: https://azure.microsoft.com/en-us/pricing/details/cognitive-services/openai-service/

+# RAG Embedding.
+# For backward compatibility, if `embedding` is not set and the llm's api_type is either openai or azure, the llm's config is used for embedding.
+embedding:
+    api_type: ""  # openai / azure / gemini / ollama, etc. See EmbeddingType for more options.
+    base_url: ""
+    api_key: ""
+    model: ""
+    api_version: ""
+    embed_batch_size: 100
+
 repair_llm_output: true  # when the output is not a valid json, try to repair it

 proxy: "YOUR_PROXY"  # for tools like requests, playwright, selenium, etc.