Skip to content

Commit e4e4c9f

Browse files
yichieh-lucyyeh and others authored
feat(wren-ai-service): add support for new GPT-5 models in configuration files (ai-env-changed) (#1875)
Co-authored-by: ChihYu Yeh <[email protected]>
1 parent 15a5ddf commit e4e4c9f

8 files changed

Lines changed: 776 additions & 107 deletions

File tree

deployment/kustomizations/base/cm.yaml

Lines changed: 18 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -75,7 +75,24 @@ data:
7575
n: 1
7676
seed: 0
7777
temperature: 0
78-
78+
- model: gpt-5-nano-2025-08-07
79+
context_window_size: 380000
80+
kwargs:
81+
max_completion_tokens: 4096
82+
n: 1
83+
seed: 0
84+
- model: gpt-5-mini-2025-08-07
85+
context_window_size: 380000
86+
kwargs:
87+
max_completion_tokens: 4096
88+
n: 1
89+
seed: 0
90+
- model: gpt-5-2025-08-07
91+
context_window_size: 380000
92+
kwargs:
93+
max_completion_tokens: 4096
94+
n: 1
95+
seed: 0
7996
---
8097
type: embedder
8198
provider: litellm_embedder

docker/config.example.yaml

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,24 @@ models:
2424
n: 1
2525
seed: 0
2626
temperature: 0
27+
- model: gpt-5-nano-2025-08-07
28+
context_window_size: 380000
29+
kwargs:
30+
max_completion_tokens: 4096
31+
n: 1
32+
seed: 0
33+
- model: gpt-5-mini-2025-08-07
34+
context_window_size: 380000
35+
kwargs:
36+
max_completion_tokens: 4096
37+
n: 1
38+
seed: 0
39+
- model: gpt-5-2025-08-07
40+
context_window_size: 380000
41+
kwargs:
42+
max_completion_tokens: 4096
43+
n: 1
44+
seed: 0
2745

2846
---
2947
type: embedder

wren-ai-service/poetry.lock

Lines changed: 694 additions & 102 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

wren-ai-service/pyproject.toml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@ package-mode = false
1010
[tool.poetry.dependencies]
1111
python = ">=3.12.*, <3.13"
1212
fastapi = "^0.115.2"
13-
uvicorn = {extras = ["standard"], version = "^0.30.1"}
13+
uvicorn = {extras = ["standard"], version = "^0.29.0"} # Litellm requires uvicorn < 0.30.0
1414
python-dotenv = "^1.0.1"
1515
haystack-ai = "==2.7.0"
1616
openai = "^1.40.0"
@@ -33,8 +33,8 @@ pydantic-settings = "^2.5.2"
3333
google-auth = "^2.35.0"
3434
tiktoken = "^0.8.0"
3535
jsonschema = "^4.23.0"
36-
litellm = "^1.70.0"
37-
boto3 = "^1.35.90"
36+
litellm = {extras = ["proxy"], version = "^1.75.2"}
37+
boto3 = "^1.34.34" # Litellm requires boto3 = 1.34.34
3838
qdrant-client = "==1.11.0"
3939

4040
[tool.poetry.group.dev.dependencies]

wren-ai-service/tools/config/config.example.yaml

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,24 @@ models:
2424
n: 1
2525
seed: 0
2626
temperature: 0
27+
- model: gpt-5-nano-2025-08-07
28+
context_window_size: 380000
29+
kwargs:
30+
max_completion_tokens: 4096
31+
n: 1
32+
seed: 0
33+
- model: gpt-5-mini-2025-08-07
34+
context_window_size: 380000
35+
kwargs:
36+
max_completion_tokens: 4096
37+
n: 1
38+
seed: 0
39+
- model: gpt-5-2025-08-07
40+
context_window_size: 380000
41+
kwargs:
42+
max_completion_tokens: 4096
43+
n: 1
44+
seed: 0
2745

2846
---
2947
type: embedder

wren-ai-service/tools/config/config.full.yaml

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,24 @@ models:
2424
n: 1
2525
seed: 0
2626
temperature: 0
27+
- model: gpt-5-nano-2025-08-07
28+
context_window_size: 380000
29+
kwargs:
30+
max_completion_tokens: 4096
31+
n: 1
32+
seed: 0
33+
- model: gpt-5-mini-2025-08-07
34+
context_window_size: 380000
35+
kwargs:
36+
max_completion_tokens: 4096
37+
n: 1
38+
seed: 0
39+
- model: gpt-5-2025-08-07
40+
context_window_size: 380000
41+
kwargs:
42+
max_completion_tokens: 4096
43+
n: 1
44+
seed: 0
2745

2846
---
2947
type: embedder

wren-launcher/commands/launch.go

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -109,7 +109,7 @@ func askForGenerationModel() (string, error) {
109109

110110
prompt := promptui.Select{
111111
Label: "Select an OpenAI's generation model",
112-
Items: []string{"gpt-4.1", "gpt-4.1-mini", "gpt-4.1-nano"},
112+
Items: []string{"gpt-4.1", "gpt-4.1-mini", "gpt-4.1-nano", "gpt-5", "gpt-5-mini", "gpt-5-nano"},
113113
}
114114

115115
_, result, err := prompt.Run()
@@ -389,6 +389,9 @@ func getOpenaiGenerationModel() (string, bool) {
389389
"gpt-4.1": true,
390390
"gpt-4.1-mini": true,
391391
"gpt-4.1-nano": true,
392+
"gpt-5": true,
393+
"gpt-5-mini": true,
394+
"gpt-5-nano": true,
392395
}
393396
if !validModels[openaiGenerationModel] {
394397
pterm.Error.Println("Invalid generation model", openaiGenerationModel)

wren-launcher/utils/docker.go

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -34,6 +34,9 @@ var generationModelToModelName = map[string]string{
3434
"gpt-4.1": "gpt-4.1-2025-04-14",
3535
"gpt-4.1-mini": "gpt-4.1-mini-2025-04-14",
3636
"gpt-4.1-nano": "gpt-4.1-nano-2025-04-14",
37+
"gpt-5": "gpt-5-2025-08-07",
38+
"gpt-5-mini": "gpt-5-mini-2025-08-07",
39+
"gpt-5-nano": "gpt-5-nano-2025-08-07",
3740
}
3841

3942
func replaceEnvFileContent(content string, projectDir string, openaiApiKey string, openAIGenerationModel string, hostPort int, aiPort int, userUUID string, telemetryEnabled bool, platform string, localStorage string) string {

0 commit comments

Comments (0)