import { Global } from "../global"
import { Log } from "../util/log"
import path from "path"
import { Installation } from "../installation"
import type { ModelsDev } from "./models"

const log = Log.create({ service: "fetch-models" })
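
// Fetches model listings from OpenAI-compatible endpoints, infers capability
// metadata (context limits, modalities, tool support) from model ids, and
// caches the normalized results on disk.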
export namespace FetchModels {
  export interface OpenAIModel {
    id: string
    object: string
    created: number
    owned_by: string
  }

  export interface OpenAIModelsResponse {
    object: string
    data: OpenAIModel[]
  }

  export interface FetchOptions {
    baseURL: string
    apiKey?: string
    customEndpoint?: string
    headers?: Record<string, string>
  }

  const cacheDir = path.join(Global.Path.cache, "fetched-models")

  function getCacheFilePath(providerId: string): string {
    return path.join(cacheDir, `${providerId}.json`)
  }
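
  // Infer the context window from the model id: prefer an explicit "<n>k"/"<n>m"
  // marker in the name, then known model families, then a 128k default.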
  function inferContextLimit(modelId: string): number {
    const lower = modelId.toLowerCase()
    // Check for an explicit context size in the name (e.g. "32k", "1m")
    const contextMatch = lower.match(/(\d+)([km])(?=\b|[^a-z])/)
    if (contextMatch) {
      const num = parseInt(contextMatch[1])
      if (contextMatch[2] === "m") return num * 1000000
      if (contextMatch[2] === "k") return num * 1000
    }
    // Known model families
    if (lower.includes("claude-3-opus") || lower.includes("claude-opus-4")) return 200000
    if (lower.includes("claude-3-5-sonnet") || lower.includes("claude-sonnet-4")) return 200000
    if (lower.includes("claude-3-haiku") || lower.includes("claude-haiku-4")) return 200000
    if (lower.includes("claude-3")) return 200000
    if (lower.includes("gpt-4o")) return 128000
    if (lower.includes("gpt-4-turbo")) return 128000
    if (lower.includes("gpt-4")) return 8192
    if (lower.includes("gpt-3.5-turbo")) return 16385
    if (lower.includes("gemini-1.5-pro") || lower.includes("gemini-3-pro")) return 2097152
    if (lower.includes("gemini-1.5-flash") || lower.includes("gemini-3-flash")) return 1048576
    if (lower.includes("gemini")) return 1048576
    if (lower.includes("deepseek")) return 262144
    if (lower.includes("llama-3.1") || lower.includes("llama-3-1")) return 128000
    if (lower.includes("llama-3")) return 8192
    if (lower.includes("mistral-large") || lower.includes("mistral-small")) return 128000
    if (lower.includes("mixtral")) return 32768
    if (lower.includes("kimi")) return 262144
    return 128000 // Safe default
  }
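
  // Infer the maximum output token limit from known model families (4096 default).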
  function inferOutputLimit(modelId: string): number {
    const lower = modelId.toLowerCase()
    if (lower.includes("claude-3-opus") || lower.includes("claude-opus-4")) return 32000
    if (lower.includes("claude-3-5-sonnet") || lower.includes("claude-sonnet-4")) return 32000
    if (lower.includes("claude-3-haiku") || lower.includes("claude-haiku-4")) return 32000
    if (lower.includes("claude-3")) return 4096
    if (lower.includes("gpt-4o")) return 16384
    if (lower.includes("gpt-4-turbo")) return 4096
    if (lower.includes("gpt-4")) return 8192
    if (lower.includes("gemini-3")) return 32000
    if (lower.includes("gemini-1.5")) return 8192
    if (lower.includes("deepseek")) return 32000
    if (lower.includes("kimi")) return 32000
    return 4096 // Default
  }
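
  // A model is treated as accepting image attachments when its id matches a
  // known vision-capable family.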
  function inferAttachmentSupport(modelId: string): boolean {
    const visionModels = [
      "vision",
      "claude-3",
      "claude-opus-4",
      "claude-sonnet-4",
      "claude-haiku-4",
      "gpt-4o",
      "gemini",
      "kimi",
      "qwen-vl",
      "multimodal",
      "pixtral",
      "llava",
    ]
    return visionModels.some((v) => modelId.toLowerCase().includes(v))
  }
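
  // Reasoning support is flagged for ids that look like reasoning/thinking models.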
  function inferReasoningSupport(modelId: string): boolean {
    const reasoningModels = ["o1", "o3", "reasoning", "r1", "thinking", "deepseek-r1", "glm-flash-thinking"]
    return reasoningModels.some((r) => modelId.toLowerCase().includes(r))
  }
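
  // Tool calling: rule out non-chat models (embeddings, audio, image) first,
  // then allow known modern chat families.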
  function inferToolCallSupport(modelId: string): boolean {
    const noToolModels = ["embedding", "embed", "tts", "whisper", "moderation", "dall-e", "image", "audio"]
    const hasNoTool = noToolModels.some((m) => modelId.toLowerCase().includes(m))
    if (hasNoTool) return false

    // Most modern models support tool calling
    const modernModels = [
      "claude-3",
      "claude-opus-4",
      "claude-sonnet-4",
      "claude-haiku-4",
      "gpt-4",
      "gpt-3.5-turbo",
      "gemini",
      "mistral",
      "mixtral",
      "llama-3",
      "kimi",
      "deepseek",
      "command-r",
    ]
    return modernModels.some((m) => modelId.toLowerCase().includes(m))
  }
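
  // Map a model id to input/output modalities, reusing the heuristics above to
  // distinguish embedding, speech, image-generation, and vision models.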
  function inferModalities(modelId: string): { input: string[]; output: string[] } {
    const lower = modelId.toLowerCase()
    const isEmbedding = lower.includes("embedding") || lower.includes("embed")
    const isTTS = lower.includes("tts") || lower.includes("whisper")
    const isImageGen = lower.includes("dall-e") || lower.includes("image") || lower.includes("stable-diffusion")
    const isVision = inferAttachmentSupport(modelId)

    if (isEmbedding) {
      return { input: ["text"], output: [] }
    }
    if (isTTS) {
      return { input: ["text"], output: ["audio"] }
    }
    if (isImageGen) {
      return { input: ["text"], output: ["image"] }
    }

    const input: string[] = ["text"]
    if (isVision) input.push("image")

    return { input, output: ["text"] }
  }
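
  // Convert an entry from the OpenAI models list into the internal
  // ModelsDev.Model shape, filling in inferred limits and capability flags.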
  function transformOpenAIModel(model: OpenAIModel): ModelsDev.Model {
    const modalities = inferModalities(model.id)
    const releaseDate = model.created
      ? new Date(model.created * 1000).toISOString().split("T")[0]
      : new Date().toISOString().split("T")[0]

    return {
      id: model.id,
      name: model.id,
      release_date: releaseDate,
      attachment: inferAttachmentSupport(model.id),
      reasoning: inferReasoningSupport(model.id),
      temperature: true,
      tool_call: inferToolCallSupport(model.id),
      limit: {
        context: inferContextLimit(model.id),
        output: inferOutputLimit(model.id),
      },
      modalities: {
        input: modalities.input as ("text" | "audio" | "image" | "video" | "pdf")[],
        output: modalities.output as ("text" | "audio" | "image" | "video" | "pdf")[],
      },
      options: {},
    }
  }
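
  // Fetch the raw model list from the provider. Uses the custom endpoint when
  // given, otherwise appends /v1/models to the base URL.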
  export async function fetchFromEndpoint(options: FetchOptions): Promise<ModelsDev.Model[]> {
    const endpoint = options.customEndpoint || `${options.baseURL.replace(/\/$/, "")}/v1/models`

    log.info("Fetching models from endpoint", { endpoint })

    const headers: Record<string, string> = {
      "User-Agent": Installation.USER_AGENT,
      ...options.headers,
    }

    if (options.apiKey) {
      headers["Authorization"] = `Bearer ${options.apiKey}`
    }

    const response = await fetch(endpoint, {
      headers,
      signal: AbortSignal.timeout(30 * 1000), // 30 second timeout
    })

    if (!response.ok) {
      const errorText = await response.text().catch(() => "Unknown error")
      throw new Error(`Failed to fetch models: ${response.status} ${response.statusText} - ${errorText}`)
    }

    const data: OpenAIModelsResponse = await response.json()

    if (!data.data || !Array.isArray(data.data)) {
      throw new Error("Invalid response format: expected 'data' array")
    }

    log.info("Successfully fetched models", { count: data.data.length })

    return data.data.map(transformOpenAIModel)
  }
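
  // Shape of a cache file: the fetched models plus the timestamp and TTL used
  // to decide expiry.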
  export interface CachedModels {
    timestamp: number
    models: ModelsDev.Model[]
    ttl: number
  }
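
  // Read cached models for a provider; returns undefined when the cache file is
  // missing, expired, or unreadable.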
  export async function getCached(providerId: string, ttlMs: number = 60 * 60 * 1000): Promise<ModelsDev.Model[] | undefined> {
    try {
      const cacheFile = Bun.file(getCacheFilePath(providerId))
      const exists = await cacheFile.exists()
      if (!exists) return undefined

      const cached: CachedModels = await cacheFile.json()
      const now = Date.now()

      if (now - cached.timestamp > (cached.ttl || ttlMs)) {
        log.debug("Cache expired", { providerId })
        return undefined
      }

      log.debug("Using cached models", { providerId, count: cached.models.length })
      return cached.models
    } catch (error) {
      log.debug("Failed to read cache", { providerId, error })
      return undefined
    }
  }
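
  // Write models to the provider's cache file; failures are logged, never thrown.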
  export async function setCached(providerId: string, models: ModelsDev.Model[], ttlMs: number = 60 * 60 * 1000): Promise<void> {
    try {
      // Ensure cache directory exists
      await Bun.$`mkdir -p ${cacheDir}`.nothrow().quiet()

      const cacheData: CachedModels = {
        timestamp: Date.now(),
        models,
        ttl: ttlMs,
      }

      const cacheFile = getCacheFilePath(providerId)
      await Bun.write(cacheFile, JSON.stringify(cacheData, null, 2))

      log.debug("Cached models", { providerId, count: models.length })
    } catch (error) {
      log.warn("Failed to cache models", { providerId, error })
    }
  }
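
  // Fetch models for a provider, consulting the on-disk cache first when enabled.
  // Usage sketch (provider id and base URL below are hypothetical):
  //   const models = await FetchModels.fetchWithCache("example", {
  //     baseURL: "https://api.example.com",
  //     apiKey: process.env.EXAMPLE_API_KEY,
  //   })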
  export async function fetchWithCache(
    providerId: string,
    options: FetchOptions,
    cacheOptions?: { enabled?: boolean; ttlMs?: number }
  ): Promise<ModelsDev.Model[]> {
    const { enabled = true, ttlMs = 60 * 60 * 1000 } = cacheOptions || {}

    if (enabled) {
      const cached = await getCached(providerId, ttlMs)
      if (cached) return cached
    }

    const models = await fetchFromEndpoint(options)

    if (enabled) {
      await setCached(providerId, models, ttlMs)
    }

    return models
  }
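
  // Delete the cache file for one provider, or every cached model list when no
  // provider id is given.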
  export async function invalidateCache(providerId?: string): Promise<void> {
    try {
      if (providerId) {
        const cacheFile = getCacheFilePath(providerId)
        await Bun.file(cacheFile).delete().catch(() => {})
        log.info("Invalidated cache for provider", { providerId })
      } else {
        // Invalidate all caches
        const glob = new Bun.Glob("*.json")
        for await (const file of glob.scan({ cwd: cacheDir })) {
          await Bun.file(path.join(cacheDir, file)).delete().catch(() => {})
        }
        log.info("Invalidated all model caches")
      }
    } catch (error) {
      log.warn("Failed to invalidate cache", { providerId, error })
    }
  }
}