Merge remote-tracking branch 'origin/main' into devin/1764806701-keyterms-multilingual-support

devin-ai-integration[bot] · devin-ai-integration[bot] · commit 451779f00595 · 2025-12-04T01:11:38.000Z
diff --git a/fern/.definition/__package__.yml b/fern/.definition/__package__.yml
@@ -52,3 +52,10 @@ errors:
           error: Authentication error, API token missing/invalid
     status-code: 401
     type: Error
+  CannotAccessUploadedFileError:
+    docs: Cannot access uploaded file
+    examples:
+      - value:
+          error: Cannot access uploaded file
+    status-code: 403
+    type: Error
diff --git a/fern/.definition/files.yml b/fern/.definition/files.yml
@@ -21,10 +21,13 @@ service:
         <Note>To upload a media file to our EU server, replace
         `api.assemblyai.com` with `api.eu.assemblyai.com`.</Note>
 
+        <Warning>Requests to transcribe uploaded files must use an API key from the same project as the key that was used to upload the file. If you use an API key from a different project, you will get a `403` error with the message "Cannot access uploaded file".</Warning>
+
         Upload a media file to AssemblyAI's servers.
       errors:
         - root.BadRequestError
         - root.UnauthorizedError
+        - root.CannotAccessUploadedFileError
         - root.NotFoundError
         - root.TooManyRequestsError
         - root.InternalServerError
diff --git a/fern/docs.yml b/fern/docs.yml
@@ -972,6 +972,9 @@ navigation:
               - page: Do you offer EU Data Residency?
                 path: pages/faq/privacy-security/do-you-offer-eu-data-residency.mdx
                 slug: /do-you-offer-eu-data-residency
+              - page: Do you offer self-hosted solutions?
+                path: pages/faq/privacy-security/do-you-offer-self-hosted-solutions.mdx
+                slug: /do-you-offer-self-hosted-solutions
               - page: Do you offer servers in the EU?
                 path: pages/faq/privacy-security/do-you-offer-servers-in-the-eu.mdx
                 slug: /do-you-offer-servers-in-the-eu
diff --git a/fern/pages/07-llm-gateway/llm-gateway.mdx b/fern/pages/07-llm-gateway/llm-gateway.mdx
@@ -20,34 +20,38 @@ The LLM Gateway provides access to 15+ models across major AI providers with sup
 
 ### Anthropic Claude
 
-| Model                 | Parameter                    | Latency per 10,000 tokens | [LMArena Score](https://lmarena.ai/leaderboard) | Description                                            |
-| --------------------- | ---------------------------- | ------------------------- | ------------- | ------------------------------------------------------ |
-| **Claude 4.5 Sonnet** | `claude-sonnet-4-5-20250929` | 10.1s                     | 1444          | Claude's best model for complex agents and coding      |
-| **Claude 4 Sonnet**   | `claude-sonnet-4-20250514`   | 7.1s                      | 1389          | High-performance model                                 |
-| **Claude 4 Opus**     | `claude-opus-4-20250514`     | 15.4s                     | 1412          | Claude's previous flagship model                       |
-| **Claude 4.5 Haiku**  | `claude-haiku-4-5-20251001`  | 4.6s                      | 1402          | Claude's fastest and most intelligent Haiku model      |
-| **Claude 3.5 Haiku**  | `claude-3-5-haiku-20241022`  | 5.4s                      | 1322          | Fast and efficient model with strong performance       |
-| **Claude 3.0 Haiku**  | `claude-3-haiku-20240307`    | 4.8s                      | 1262          | Fast and compact model for near-instant responsiveness |
+| Model                 | Parameter                    | Latency per 10,000 tokens | [LMArena Score](https://lmarena.ai/leaderboard) | Description          | Retention Policy | Anthropic Model Training |
+| --------------------- | ---------------------------- | ------------------------- | ------------- | ------------------------------------------------------ | ---------------- | ------------------------ |
+| **Claude 4.5 Sonnet** | `claude-sonnet-4-5-20250929` | 10.1s                     | 1444          | Claude's best model for complex agents and coding      | We use this model through Amazon Bedrock. Amazon Bedrock doesn't store or log your prompts and completions. Amazon Bedrock doesn't use your prompts and completions to train any AWS models and doesn't distribute them to third parties. See [here](https://docs.aws.amazon.com/bedrock/latest/userguide/data-protection.html) for more information on Amazon Bedrock data protection policies.* | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **Claude 4 Sonnet**   | `claude-sonnet-4-20250514`   | 7.1s                      | 1389          | High-performance model                                 | We use this model through Amazon Bedrock. Amazon Bedrock doesn't store or log your prompts and completions. Amazon Bedrock doesn't use your prompts and completions to train any AWS models and doesn't distribute them to third parties. See [here](https://docs.aws.amazon.com/bedrock/latest/userguide/data-protection.html) for more information on Amazon Bedrock data protection policies.* | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **Claude 4 Opus**     | `claude-opus-4-20250514`     | 15.4s                     | 1412          | Claude's previous flagship model                       | We use this model through Amazon Bedrock. Amazon Bedrock doesn't store or log your prompts and completions. Amazon Bedrock doesn't use your prompts and completions to train any AWS models and doesn't distribute them to third parties. See [here](https://docs.aws.amazon.com/bedrock/latest/userguide/data-protection.html) for more information on Amazon Bedrock data protection policies.* | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **Claude 4.5 Haiku**  | `claude-haiku-4-5-20251001`  | 4.6s                      | 1402          | Claude's fastest and most intelligent Haiku model      | We use this model through Amazon Bedrock. Amazon Bedrock doesn't store or log your prompts and completions. Amazon Bedrock doesn't use your prompts and completions to train any AWS models and doesn't distribute them to third parties. See [here](https://docs.aws.amazon.com/bedrock/latest/userguide/data-protection.html) for more information on Amazon Bedrock data protection policies.* | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **Claude 3.5 Haiku**  | `claude-3-5-haiku-20241022`  | 5.4s                      | 1322          | Fast and efficient model with strong performance       | We use this model through Amazon Bedrock. Amazon Bedrock doesn't store or log your prompts and completions. Amazon Bedrock doesn't use your prompts and completions to train any AWS models and doesn't distribute them to third parties. See [here](https://docs.aws.amazon.com/bedrock/latest/userguide/data-protection.html) for more information on Amazon Bedrock data protection policies.* | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **Claude 3.0 Haiku**  | `claude-3-haiku-20240307`    | 4.8s                      | 1262          | Fast and compact model for near-instant responsiveness | We use this model through Amazon Bedrock. Amazon Bedrock doesn't store or log your prompts and completions. Amazon Bedrock doesn't use your prompts and completions to train any AWS models and doesn't distribute them to third parties. See [here](https://docs.aws.amazon.com/bedrock/latest/userguide/data-protection.html) for more information on Amazon Bedrock data protection policies.* | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+
+<Note>
+  *For non-EU customers, if Amazon Bedrock fails, we may send your request to the Anthropic API, where we have 0-day retention configured. Please see [Anthropic's commercial terms](https://www.anthropic.com/legal/commercial-terms).
+</Note>
 
 ### OpenAI GPT
 
-| Model            | Parameter           | Latency per 10,000 tokens | [LMArena Score](https://lmarena.ai/leaderboard) | Description                                                      |
-| ---------------- | ------------------- | ------------------------- | ------------- | ---------------------------------------------------------------- |
-| **GPT-5**        | `gpt-5`             | 18.9s                     | 1425          | OpenAI's best model for coding and agentic tasks across domains  |
-| **GPT-5 nano**   | `gpt-5-nano`        | 11.2s                     | 1338          | OpenAI's fastest, most cost-efficient version of GPT-5           |
-| **GPT-5 mini**   | `gpt-5-mini`        | 21.9s                     | 1393          | A faster, cost-efficient version of GPT-5 for well-defined tasks |
-| **GPT-4.1**      | `gpt-4.1`           | 12.6s                     | 1412          | OpenAI's smartest non-reasoning model                            |
-| **gpt-oss-120b** | `gpt-oss-120b`      | 10.5s                     | 1352          | OpenAI's most powerful open-weight model                         |
-| **gpt-oss-20b**  | `gpt-oss-20b`       | 4.2s                      | 1318          | Medium-sized open-weight model for low latency                   |
+| Model            | Parameter           | Latency per 10,000 tokens | [LMArena Score](https://lmarena.ai/leaderboard) | Description                    | Retention Policy | OpenAI Model Training |
+| ---------------- | ------------------- | ------------------------- | ------------- | ---------------------------------------------------------------- | ---------------- | --------------------- |
+| **GPT-5**        | `gpt-5`             | 18.9s                     | 1425          | OpenAI's best model for coding and agentic tasks across domains  | Abuse monitoring retains logs for 30 days. If you require zero data retention (ZDR), please use Anthropic or Google models. | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **GPT-5 nano**   | `gpt-5-nano`        | 11.2s                     | 1338          | OpenAI's fastest, most cost-efficient version of GPT-5           | Abuse monitoring retains logs for 30 days. If you require zero data retention (ZDR), please use Anthropic or Google models. | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **GPT-5 mini**   | `gpt-5-mini`        | 21.9s                     | 1393          | A faster, cost-efficient version of GPT-5 for well-defined tasks | Abuse monitoring retains logs for 30 days. If you require zero data retention (ZDR), please use Anthropic or Google models. | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **GPT-4.1**      | `gpt-4.1`           | 12.6s                     | 1412          | OpenAI's smartest non-reasoning model                            | Abuse monitoring retains logs for 30 days. If you require zero data retention (ZDR), please use Anthropic or Google models. | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **gpt-oss-120b** | `gpt-oss-120b`      | 10.5s                     | 1352          | OpenAI's most powerful open-weight model                         | We use this model through Amazon Bedrock. Amazon Bedrock doesn't store or log your prompts and completions. Amazon Bedrock doesn't use your prompts and completions to train any AWS models and doesn't distribute them to third parties. See [here](https://docs.aws.amazon.com/bedrock/latest/userguide/data-protection.html) for more information on Amazon Bedrock data protection policies. | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **gpt-oss-20b**  | `gpt-oss-20b`       | 4.2s                      | 1318          | Medium-sized open-weight model for low latency                   | We use this model through Amazon Bedrock. Amazon Bedrock doesn't store or log your prompts and completions. Amazon Bedrock doesn't use your prompts and completions to train any AWS models and doesn't distribute them to third parties. See [here](https://docs.aws.amazon.com/bedrock/latest/userguide/data-protection.html) for more information on Amazon Bedrock data protection policies. | AssemblyAI has opted out of model training with all LLM Gateway providers. |
 
 ### Google Gemini
 
-| Model                     | Parameter               | Latency per 10,000 tokens | [LMArena Score](https://lmarena.ai/leaderboard) | Description                                                                           |
-| ------------------------- | ----------------------- | ------------------------- | ------------- | ------------------------------------------------------------------------------------- |
-| **Gemini 3 Pro Preview**  | `gemini-3-pro-preview`  | TBD                       | 1495          | Gemini's most powerful agentic and vibe-coding model, delivering richer visuals and deeper interactivity |
-| **Gemini 2.5 Pro**        | `gemini-2.5-pro`        | 13.9s                     | 1451          | Gemini's state-of-the-art thinking model, capable of reasoning over complex problems                         |
-| **Gemini 2.5 Flash**      | `gemini-2.5-flash`      | 8.3s                      | 1407          | Gemini's best model in terms of price-performance, offering well-rounded capabilities                     |
-| **Gemini 2.5 Flash-Lite** | `gemini-2.5-flash-lite` | 1.6s                      | 1375          | Gemini's fastest flash model optimized for cost-efficiency and high throughput                       |
+| Model                     | Parameter               | Latency per 10,000 tokens | [LMArena Score](https://lmarena.ai/leaderboard) | Description                                                            | Retention Policy | Google Model Training |
+| ------------------------- | ----------------------- | ------------------------- | ------------- | -------------------------------------------------------------------------------------------------------- | ---------------- | -------------- |
+| **Gemini 3 Pro Preview**  | `gemini-3-pro-preview`  | TBD                       | 1495          | Gemini's most powerful agentic and vibe-coding model, delivering richer visuals and deeper interactivity | ZDR (see Google's policy [here](https://docs.cloud.google.com/vertex-ai/generative-ai/docs/vertex-ai-zero-data-retention) for more information on how Google defines ZDR) | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **Gemini 2.5 Pro**        | `gemini-2.5-pro`        | 13.9s                     | 1451          | Gemini's state-of-the-art thinking model, capable of reasoning over complex problems                     | ZDR (see Google's policy [here](https://docs.cloud.google.com/vertex-ai/generative-ai/docs/vertex-ai-zero-data-retention) for more information on how Google defines ZDR) | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **Gemini 2.5 Flash**      | `gemini-2.5-flash`      | 8.3s                      | 1407          | Gemini's best model in terms of price-performance, offering well-rounded capabilities                    | ZDR (see Google's policy [here](https://docs.cloud.google.com/vertex-ai/generative-ai/docs/vertex-ai-zero-data-retention) for more information on how Google defines ZDR) | AssemblyAI has opted out of model training with all LLM Gateway providers. |
+| **Gemini 2.5 Flash-Lite** | `gemini-2.5-flash-lite` | 1.6s                      | 1375          | Gemini's fastest flash model optimized for cost-efficiency and high throughput                           | ZDR (see Google's policy [here](https://docs.cloud.google.com/vertex-ai/generative-ai/docs/vertex-ai-zero-data-retention) for more information on how Google defines ZDR) | AssemblyAI has opted out of model training with all LLM Gateway providers. |
 
 Unsure which model to choose?
 
diff --git a/fern/pages/faq/privacy-security/do-you-offer-self-hosted-solutions.mdx b/fern/pages/faq/privacy-security/do-you-offer-self-hosted-solutions.mdx
@@ -0,0 +1,7 @@
+---
+title: "Do you offer self-hosted solutions?"
+---
+
+Yes, we offer self-hosted solutions for organizations that require greater control over their data and infrastructure. Our self-hosted options allow you to deploy our services within your own environment, ensuring compliance with your organization's security policies and regulatory requirements.
+
+[Contact our sales team](https://www.assemblyai.com/contact/sales) to discuss your specific needs and to learn more about our self-hosted offerings.
diff --git a/openapi.json b/openapi.json
@@ -83,6 +83,9 @@
           "401": {
             "$ref": "#/components/responses/Unauthorized"
           },
+          "403": {
+            "$ref": "#/components/responses/CannotAccessUploadedFile"
+          },
           "404": {
             "$ref": "#/components/responses/NotFound"
           },
@@ -6802,6 +6805,20 @@
           }
         }
       },
+      "CannotAccessUploadedFile": {
+        "x-label": "Cannot access uploaded file",
+        "description": "Cannot access uploaded file",
+        "content": {
+          "application/json": {
+            "schema": {
+              "$ref": "#/components/schemas/Error"
+            },
+            "example": {
+              "error": "Cannot access uploaded file"
+            }
+          }
+        }
+      },
       "NotFound": {
         "x-label": "Not found",
         "description": "Not found",
diff --git a/openapi.yml b/openapi.yml
@@ -39,8 +39,10 @@ paths:
         - transcript
       summary: Upload a media file
       description: |
-        <Note>To upload a media file to our EU server, replace `api.assemblyai.com` with `api.eu.assemblyai.com`.</Note>
         Upload a media file to AssemblyAI's servers.
+
+        <Note>To upload a media file to our EU server, replace `api.assemblyai.com` with `api.eu.assemblyai.com`.</Note>
+        <Warning>Requests to transcribe uploaded files must use an API key from the same project as the key that was used to upload the file. If you use an API key from a different project, you will get a `403` error with the message "Cannot access uploaded file".</Warning>
       operationId: uploadFile
       x-fern-sdk-group-name: files
       x-fern-sdk-method-name: upload
@@ -62,6 +64,8 @@ paths:
           $ref: "#/components/responses/BadRequest"
         "401":
           $ref: "#/components/responses/Unauthorized"
+        "403":
+          $ref: "#/components/responses/CannotAccessUploadedFile"
         "404":
           $ref: "#/components/responses/NotFound"
         "429":
@@ -6276,6 +6280,14 @@ components:
             $ref: "#/components/schemas/Error"
           example:
             { "error": "Authentication error, API token missing/invalid" }
+    CannotAccessUploadedFile:
+      x-label: Cannot access uploaded file
+      description: Cannot access uploaded file
+      content:
+        application/json:
+          schema:
+            $ref: "#/components/schemas/Error"
+          example: { "error": "Cannot access uploaded file" }
     NotFound:
       x-label: Not found
       description: Not found