make context length configurable

2026-05-05 05:42:37 +02:00 · 2024-10-28 21:12:09 +08:00 · 2024-10-28 21:12:09 +08:00 · 7b81c8a690
commit 7b81c8a690
parent 8b209d4e17
2 changed files with 4 additions and 1 deletions
--- a/metagpt/configs/llm_config.py
+++ b/metagpt/configs/llm_config.py
@ -83,6 +83,7 @@ class LLMConfig(YamlModel):
    logprobs: Optional[bool] = None
    top_logprobs: Optional[int] = None
    timeout: int = 600
+    context_length: Optional[int] = None  # Max input tokens

    # For Amazon Bedrock
    region_name: str = None
--- a/metagpt/rag/factories/llm.py
+++ b/metagpt/rag/factories/llm.py
@ -23,10 +23,12 @@ class RAGLLM(CustomLLM):
    """LlamaIndex's LLM is different from MetaGPT's LLM.

    Inherit CustomLLM from llamaindex, making MetaGPT's LLM can be used by LlamaIndex.
+
+    Set context_length or max_token of LLM in config.yaml if you encounter "Calculated available context size -xxx was not non-negative" error.
    """

    model_infer: BaseLLM = Field(..., description="The MetaGPT's LLM.")
-    context_window: int = TOKEN_MAX.get(config.llm.model, DEFAULT_CONTEXT_WINDOW)
+    context_window: int = config.llm.context_length or TOKEN_MAX.get(config.llm.model, DEFAULT_CONTEXT_WINDOW)
    num_output: int = config.llm.max_token
    model_name: str = config.llm.model