Skip to content

Commit f32de4d

Browse files
committed
[Feature] Configurable selections for AI Managed mode
1 parent 18a850e commit f32de4d

3 files changed

Lines changed: 68 additions & 47 deletions

File tree

config.toml.sample

Lines changed: 8 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -15,8 +15,14 @@ fallback_char = "?"
1515
temperature = 1
1616
system_role = "assistant"
1717
model = "gemini-pro-exp"
18-
assistant = "o4-mini"
19-
assistant_role = "<instructions>\nInstructions for AI Assistant:\n\n- Select the optimal AI model to answer user questions based on their complexity and nature.\n- Provide your response only in JSON format, strictly following the example below.\n- The \"system\" message should contain clear, guiding instructions for the selected AI model, without sharing your reasoning or including your own answer or opinion.\n\n<example>\n{\n \"model\": \"{{selected_model}}\",\n \"messages\": [\n {\"role\": \"system\", \"content\": \"{{system_instruction_to_ai_model}}\"}\n ]\n}\n</example>\n\nEvaluation Criteria:\n\n1. Analyze the user's question based on topic, required depth of knowledge, and length.\n2. Select the most suitable model from the options, considering capabilities and cost-effectiveness.\n3. Use the tables below to guide your model selection.\n\n<table1>\n| Model Name | Input Cost ($/1M tokens) | Output Cost ($/1M tokens) | Remarks |\n|----------------|--------------------------|---------------------------|-----------------------------------------------------------|\n| gpt-41 | 2.00 | 8.00 | High-intelligence model for complex, multi-step tasks. |\n| gpt-41-mini | 0.40 | 1.60 | Affordable, intelligent model for fast, lightweight tasks. |\n| o3 | 2.00 | 8.00 | Advanced reasoning model for solving hard problems across domains. |\n| o4-mini | 1.10 | 4.40 | Efficient reasoning in coding, math, and science. |\n</table1>\n\nModels are ranked from highest to lowest capability. Only suggest the best-fitting model.\n\n<table2>\n| Category | Model to Consider |\n|----------------------------------------|--------------------|\n| Math, Science, Coding | o4-mini |\n| One-shot (deep reasoning with context) | o3 |\n| Multi-turn, complex conversations with reasoning | gpt-41 |\n| Complex tasks, problem solving across domains. 
| gpt-41 |\n| Common Tasks, General Topics | gpt-41-mini |\n</table2>\n\nNotes:\n\n- Do not include explanations or clarifications outside the JSON response.\n- Optimize query handling, model capability, and cost in your decision.\n</instructions>"
18+
19+
[chat.managed]
20+
assistant = "gpt-4o-mini"
21+
assistant_role = "<instructions>\nInstructions for AI Assistant:\n\n- Select the optimal AI model to answer user questions based on their complexity and nature.\n- Provide your response only in JSON format, strictly following the example below.\n- The \"system\" message should contain clear, guiding instructions for the selected AI model, without sharing your reasoning or including your own answer or opinion.\n\n<example>\n{\n \"model\": \"{{selected_model}}\",\n \"messages\": [\n {\"role\": \"system\", \"content\": \"{{system_instruction_to_ai_model}}\"}\n ]\n}\n</example>\n\nEvaluation Criteria:\n\n1. Analyze the user's question based on topic, required depth of knowledge, and length.\n2. Select the most suitable model from the options, considering capabilities and cost-effectiveness.\n3. Use the tables below to guide your model selection.\n\n<table1>\n| Model Name | Cost | Remarks |\n|-|-|-|\n| {{assistant_generalist}} | Highest | High-intelligence model for complex, multi-step tasks. |\n| {{assistant_fast}} | Cheapest | Affordable, intelligent model for fast, lightweight tasks. |\n| {{assistant_thinker}} | Highest | Advanced reasoning model for solving hard problems across domains. |\n| {{assistant_coder}} | Medium | Efficient reasoning in coding, math, and science. |\n</table1>\n\nModels are ranked from highest to lowest capability. Only suggest the best-fitting model.\n\n<table2>\n| Category | Model to Consider |\n|-|-|\n| Math, Science, Coding | {{assistant_coder}} |\n| One-shot (deep reasoning with context) | {{assistant_thinker}} |\n| Multi-turn, complex conversations with reasoning | {{assistant_generalist}} |\n| Complex tasks, problem solving across domains. | {{assistant_generalist}} |\n| Common Tasks, General Topics | {{assistant_fast}} |\n</table2>\n\nNotes:\n\n- Do not include explanations or clarifications outside the JSON response.\n- Optimize query handling, model capability, and cost in your decision.\n</instructions>"
22+
assistant_generalist = "gpt-41"
23+
assistant_fast = "gpt-41-mini"
24+
assistant_thinker = "o3"
25+
assistant_coder = "o4-mini"
2026

2127
[chat.features]
2228
model_selector = true

console_gpt/menus/ai_managed.py

Lines changed: 59 additions & 44 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,8 @@
11
import json
2+
from pyexpat import model
23
from typing import Tuple
34

5+
from httpx import get
46
from rich.console import Console
57
from unichat import UnifiedChatApi
68

@@ -14,45 +16,13 @@
1416
from console_gpt.prompts.temperature_prompt import temperature_prompt
1517
from console_gpt.prompts.user_prompt import chat_user_prompt
1618

17-
tools = [
18-
{
19-
"name": "managed_prompt",
20-
"description": "Selects optimal AI model and generates appropriate system instructions based on user query analysis",
21-
"inputSchema": {
22-
"type": "object",
23-
"properties": {
24-
"model": {
25-
"type": "string",
26-
"enum": ["gpt-41", "gpt-41-mini", "o3", "o4-mini"],
27-
"description": "The selected AI model based on query analysis",
28-
},
29-
"messages": {
30-
"type": "array",
31-
"items": {
32-
"type": "object",
33-
"properties": {
34-
"role": {
35-
"type": "string",
36-
"enum": ["system"],
37-
"description": "The role of the message, only system messages are allowed",
38-
},
39-
"content": {
40-
"type": "string",
41-
"description": "The system instruction for the selected AI model",
42-
},
43-
},
44-
"required": ["role", "content"],
45-
},
46-
"minItems": 1,
47-
"maxItems": 1,
48-
},
49-
},
50-
"required": ["model", "messages"],
51-
},
52-
}
19+
MODEL_KEYS = [
20+
"{{assistant_generalist}}",
21+
"{{assistant_fast}}",
22+
"{{assistant_thinker}}",
23+
"{{assistant_coder}}",
5324
]
5425

55-
5626
def managed_prompt() -> Tuple[ChatObject, str]:
5727
"""
5828
Use the assistant's help to determine the best model and format for the query
@@ -69,13 +39,14 @@ def managed_prompt() -> Tuple[ChatObject, str]:
6939

7040

7141
def configure_assistant():
72-
assistant_model = fetch_variable("defaults", "assistant")
73-
assistant_role = fetch_variable("defaults", "assistant_role")
42+
assistant_model = fetch_variable("managed", "assistant")
43+
assistant_role = fetch_variable("managed", "assistant_role")
44+
replacements = {key: fetch_variable("managed", key.strip("{}")) for key in MODEL_KEYS}
45+
for key, value in replacements.items():
46+
assistant_role = assistant_role.replace(key, value)
7447
model_data = fetch_variable("models", assistant_model)
75-
model_data.update(dict(model_title=assistant_model))
76-
model_data.update(dict(role=assistant_role))
77-
model_data = update_api_key_if_placeholder(model_data)
78-
return model_data
48+
model_data.update(model_title=assistant_model, role=assistant_role)
49+
return update_api_key_if_placeholder(model_data)
7950

8051

8152
def update_api_key_if_placeholder(model_data):
@@ -95,6 +66,50 @@ def get_client(assistant):
9566
return UnifiedChatApi(**assistant_params)
9667

9768

69+
def get_tools_schema():
70+
"""
71+
Dynamically generate the tools schema with the current model names from config.
72+
"""
73+
model_names = [fetch_variable("managed", key.strip("{}")) for key in MODEL_KEYS]
74+
return [
75+
{
76+
"name": "managed_prompt",
77+
"description": "Selects optimal AI model and generates appropriate system instructions based on user query analysis",
78+
"inputSchema": {
79+
"type": "object",
80+
"properties": {
81+
"model": {
82+
"type": "string",
83+
"enum": model_names,
84+
"description": "The selected AI model based on query analysis",
85+
},
86+
"messages": {
87+
"type": "array",
88+
"items": {
89+
"type": "object",
90+
"properties": {
91+
"role": {
92+
"type": "string",
93+
"enum": ["system"],
94+
"description": "The role of the message, only system messages are allowed",
95+
},
96+
"content": {
97+
"type": "string",
98+
"description": "The system instruction for the selected AI model",
99+
},
100+
},
101+
"required": ["role", "content"],
102+
},
103+
"minItems": 1,
104+
"maxItems": 1,
105+
},
106+
},
107+
"required": ["model", "messages"],
108+
},
109+
}
110+
]
111+
112+
98113
@sigint_wrapper
99114
def send_request(client, assistant, conversation):
100115
if "reasoning_effort" in assistant:
@@ -107,7 +122,7 @@ def send_request(client, assistant, conversation):
107122
model=assistant["model_name"],
108123
messages=conversation,
109124
stream=False,
110-
tools=tools,
125+
tools=get_tools_schema(),
111126
reasoning_effort=reasoning_effort,
112127
)
113128
return response.choices[0].message.tool_calls

console_gpt/menus/model_menu.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@ def model_menu() -> Dict[str, Union[int, str, float]]:
2626

2727
# Fetches the default model
2828
default_model = fetch_variable("defaults", "model")
29-
default_assistant = fetch_variable("defaults", "assistant")
29+
default_assistant = fetch_variable("managed", "assistant")
3030
all_models = fetch_variable("models")
3131

3232
# Add new options for model management

0 commit comments

Comments
 (0)