finalize feat:

Mixture of Experts: prefix any ollama model with "moe-" on api/chat and the original user request is passed to the selected model 3 times with temp=1 to get response variants. Each variant is then revisited and scored to find the best response among them, which is finally returned to the user. This runs longer and uses more tokens in exchange for an expected better-quality response.
2025-12-16 09:46:36 +01:00 · 2025-12-16 09:46:36 +01:00 · 434b6d4cca
commit 434b6d4cca
parent 19a13cc613
1 changed files with 25 additions and 14 deletions
--- a/enhance.py
+++ b/enhance.py
@@ -9,30 +9,41 @@ def moe(query: str, query_id: int, response: str) -> str:
    User query: {query}
    query_id: {query_id}

-    The following is an assistant response to the original user query. Analyse the response, then critizise the response by discussing both strength and weakness of the response.
+    The following is an assistant response to the original user query. Analyse the response, then criticize the it by discussing both strengths and weaknesses. Do not add additional commentary.

    <assistant_response>
    {response}
    </assistant_response>
+
+    Respond in the format:
+    original_response
+    ---
+    Response Analysis:
+    your analysis
    """
    return moe_prompt

-def moe_select_candidate(query: str, candidates_with_feedback: list[str]) -> str:
+def moe_select_candidate(query: str, candidates: list[str]) -> str:
+    if not candidates:
+            raise ValueError("No candidates supplied")
+
+    candidate_sections = ""
+    for i, cand in enumerate(candidates[:3], start=0):
+        candidate_sections += f"""
+        <candidate_{i}>
+        {cand.message.content}
+        </candidate_{i}>
+        """
+
+    # Strict instruction: "Respond **only** with the final answer."
    select_prompt = f"""
    From the following responses for the user query: {query}
-    select the best fitting candidate and formulate a final anser for the user.

-    <candidate_0>
-    {candidates_with_feedback[0].message.content}
-    </candidate_0>
+    {candidate_sections}

-    <candidate_1>
-    {candidates_with_feedback[1].message.content}
-    </candidate_1>
-
-    <candidate_2>
-    {candidates_with_feedback[2].message.content}
-    </candidate_2>
+    Choose the best candidate and output the final answer in the language of the query.
+    **Do NOT** mention candidate numbers, strengths, weaknesses, or any other commentary.
+    Just give the final answer—nothing else.
    """
-    return select_prompt
+    return select_prompt.strip()