Skip to content

Commit c30e2a0

Browse files
fix(types): remove model enum constraint in chat completions
1 parent 556c449 commit c30e2a0

File tree

10 files changed

+60
-140
lines changed

10 files changed

+60
-140
lines changed

.stats.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
configured_endpoints: 74
2-
openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/togetherai%2Ftogetherai-17535cff686ac0b5c2d265ae3702954e58f9d5dfb7cc9b25c641f15d81a37877.yml
3-
openapi_spec_hash: aa6403bd0f77df741d96b2cb9064443a
2+
openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/togetherai%2Ftogetherai-59ee1b4dba9d98feae58f6f49eed513e8af43068176ab4dec7783cea9af44dee.yml
3+
openapi_spec_hash: 07cb012932e3337076a1e2a2ce4618b7
44
config_hash: b66198d27b4d5c152688ff6cccfdeab5

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -193,7 +193,7 @@ chat_completion = client.chat.completions.create(
193193
"role": "system",
194194
}
195195
],
196-
model="Qwen/Qwen3.5-9B",
196+
model="model",
197197
reasoning={},
198198
)
199199
print(chat_completion.reasoning)

src/together/resources/chat/completions.py

Lines changed: 9 additions & 81 deletions
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22

33
from __future__ import annotations
44

5-
from typing import Dict, Union, Iterable
5+
from typing import Dict, Iterable
66
from typing_extensions import Literal, overload
77

88
import httpx
@@ -52,16 +52,7 @@ def create(
5252
self,
5353
*,
5454
messages: Iterable[completion_create_params.Message],
55-
model: Union[
56-
Literal[
57-
"Qwen/Qwen2.5-72B-Instruct-Turbo",
58-
"Qwen/Qwen2.5-7B-Instruct-Turbo",
59-
"Qwen/Qwen3.5-9B",
60-
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
61-
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
62-
],
63-
str,
64-
],
55+
model: str,
6556
chat_template_kwargs: object | Omit = omit,
6657
compliance: Literal["hipaa"] | Omit = omit,
6758
context_length_exceeded_behavior: Literal["truncate", "error"] | Omit = omit,
@@ -207,16 +198,7 @@ def create(
207198
self,
208199
*,
209200
messages: Iterable[completion_create_params.Message],
210-
model: Union[
211-
Literal[
212-
"Qwen/Qwen2.5-72B-Instruct-Turbo",
213-
"Qwen/Qwen2.5-7B-Instruct-Turbo",
214-
"Qwen/Qwen3.5-9B",
215-
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
216-
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
217-
],
218-
str,
219-
],
201+
model: str,
220202
stream: Literal[True],
221203
chat_template_kwargs: object | Omit = omit,
222204
compliance: Literal["hipaa"] | Omit = omit,
@@ -362,16 +344,7 @@ def create(
362344
self,
363345
*,
364346
messages: Iterable[completion_create_params.Message],
365-
model: Union[
366-
Literal[
367-
"Qwen/Qwen2.5-72B-Instruct-Turbo",
368-
"Qwen/Qwen2.5-7B-Instruct-Turbo",
369-
"Qwen/Qwen3.5-9B",
370-
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
371-
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
372-
],
373-
str,
374-
],
347+
model: str,
375348
stream: bool,
376349
chat_template_kwargs: object | Omit = omit,
377350
compliance: Literal["hipaa"] | Omit = omit,
@@ -517,16 +490,7 @@ def create(
517490
self,
518491
*,
519492
messages: Iterable[completion_create_params.Message],
520-
model: Union[
521-
Literal[
522-
"Qwen/Qwen2.5-72B-Instruct-Turbo",
523-
"Qwen/Qwen2.5-7B-Instruct-Turbo",
524-
"Qwen/Qwen3.5-9B",
525-
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
526-
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
527-
],
528-
str,
529-
],
493+
model: str,
530494
chat_template_kwargs: object | Omit = omit,
531495
compliance: Literal["hipaa"] | Omit = omit,
532496
context_length_exceeded_behavior: Literal["truncate", "error"] | Omit = omit,
@@ -629,16 +593,7 @@ async def create(
629593
self,
630594
*,
631595
messages: Iterable[completion_create_params.Message],
632-
model: Union[
633-
Literal[
634-
"Qwen/Qwen2.5-72B-Instruct-Turbo",
635-
"Qwen/Qwen2.5-7B-Instruct-Turbo",
636-
"Qwen/Qwen3.5-9B",
637-
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
638-
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
639-
],
640-
str,
641-
],
596+
model: str,
642597
chat_template_kwargs: object | Omit = omit,
643598
compliance: Literal["hipaa"] | Omit = omit,
644599
context_length_exceeded_behavior: Literal["truncate", "error"] | Omit = omit,
@@ -784,16 +739,7 @@ async def create(
784739
self,
785740
*,
786741
messages: Iterable[completion_create_params.Message],
787-
model: Union[
788-
Literal[
789-
"Qwen/Qwen2.5-72B-Instruct-Turbo",
790-
"Qwen/Qwen2.5-7B-Instruct-Turbo",
791-
"Qwen/Qwen3.5-9B",
792-
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
793-
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
794-
],
795-
str,
796-
],
742+
model: str,
797743
stream: Literal[True],
798744
chat_template_kwargs: object | Omit = omit,
799745
compliance: Literal["hipaa"] | Omit = omit,
@@ -939,16 +885,7 @@ async def create(
939885
self,
940886
*,
941887
messages: Iterable[completion_create_params.Message],
942-
model: Union[
943-
Literal[
944-
"Qwen/Qwen2.5-72B-Instruct-Turbo",
945-
"Qwen/Qwen2.5-7B-Instruct-Turbo",
946-
"Qwen/Qwen3.5-9B",
947-
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
948-
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
949-
],
950-
str,
951-
],
888+
model: str,
952889
stream: bool,
953890
chat_template_kwargs: object | Omit = omit,
954891
compliance: Literal["hipaa"] | Omit = omit,
@@ -1094,16 +1031,7 @@ async def create(
10941031
self,
10951032
*,
10961033
messages: Iterable[completion_create_params.Message],
1097-
model: Union[
1098-
Literal[
1099-
"Qwen/Qwen2.5-72B-Instruct-Turbo",
1100-
"Qwen/Qwen2.5-7B-Instruct-Turbo",
1101-
"Qwen/Qwen3.5-9B",
1102-
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
1103-
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
1104-
],
1105-
str,
1106-
],
1034+
model: str,
11071035
chat_template_kwargs: object | Omit = omit,
11081036
compliance: Literal["hipaa"] | Omit = omit,
11091037
context_length_exceeded_behavior: Literal["truncate", "error"] | Omit = omit,

src/together/resources/endpoints.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -352,6 +352,7 @@ def list_hardware(
352352
Args:
353353
model: Filter hardware configurations by model compatibility. When provided, the
354354
response includes availability status for each compatible configuration.
355+
[See all of Together AI's dedicated models](https://docs.together.ai/docs/dedicated-models)
355356
356357
extra_headers: Send extra headers
357358
@@ -693,6 +694,7 @@ async def list_hardware(
693694
Args:
694695
model: Filter hardware configurations by model compatibility. When provided, the
695696
response includes availability status for each compatible configuration.
697+
[See all of Together AI's dedicated models](https://docs.together.ai/docs/dedicated-models)
696698
697699
extra_headers: Send extra headers
698700

src/together/types/chat/completion_create_params.py

Lines changed: 1 addition & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -44,18 +44,7 @@ class CompletionCreateParamsBase(TypedDict, total=False):
4444
messages: Required[Iterable[Message]]
4545
"""A list of messages comprising the conversation so far."""
4646

47-
model: Required[
48-
Union[
49-
Literal[
50-
"Qwen/Qwen2.5-72B-Instruct-Turbo",
51-
"Qwen/Qwen2.5-7B-Instruct-Turbo",
52-
"Qwen/Qwen3.5-9B",
53-
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
54-
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
55-
],
56-
str,
57-
]
58-
]
47+
model: Required[str]
5948
"""The name of the model to query.
6049
6150
[See all of Together AI's chat models](https://docs.together.ai/docs/serverless-models#chat-models)

src/together/types/endpoint_list_hardware_params.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -13,4 +13,5 @@ class EndpointListHardwareParams(TypedDict, total=False):
1313
1414
When provided, the response includes availability status for each compatible
1515
configuration.
16+
[See all of Together AI's dedicated models](https://docs.together.ai/docs/dedicated-models)
1617
"""

tests/api_resources/chat/test_completions.py

Lines changed: 16 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@ def test_method_create_overload_1(self, client: Together) -> None:
2626
"role": "system",
2727
}
2828
],
29-
model="Qwen/Qwen3.5-9B",
29+
model="model",
3030
)
3131
assert_matches_type(ChatCompletion, completion, path=["response"])
3232

@@ -40,7 +40,7 @@ def test_method_create_with_all_params_overload_1(self, client: Together) -> Non
4040
"name": "name",
4141
}
4242
],
43-
model="Qwen/Qwen3.5-9B",
43+
model="model",
4444
chat_template_kwargs={},
4545
compliance="hipaa",
4646
context_length_exceeded_behavior="truncate",
@@ -90,7 +90,7 @@ def test_raw_response_create_overload_1(self, client: Together) -> None:
9090
"role": "system",
9191
}
9292
],
93-
model="Qwen/Qwen3.5-9B",
93+
model="model",
9494
)
9595

9696
assert response.is_closed is True
@@ -107,7 +107,7 @@ def test_streaming_response_create_overload_1(self, client: Together) -> None:
107107
"role": "system",
108108
}
109109
],
110-
model="Qwen/Qwen3.5-9B",
110+
model="model",
111111
) as response:
112112
assert not response.is_closed
113113
assert response.http_request.headers.get("X-Stainless-Lang") == "python"
@@ -126,7 +126,7 @@ def test_method_create_overload_2(self, client: Together) -> None:
126126
"role": "system",
127127
}
128128
],
129-
model="Qwen/Qwen3.5-9B",
129+
model="model",
130130
stream=True,
131131
)
132132
completion_stream.response.close()
@@ -141,7 +141,7 @@ def test_method_create_with_all_params_overload_2(self, client: Together) -> Non
141141
"name": "name",
142142
}
143143
],
144-
model="Qwen/Qwen3.5-9B",
144+
model="model",
145145
stream=True,
146146
chat_template_kwargs={},
147147
compliance="hipaa",
@@ -191,7 +191,7 @@ def test_raw_response_create_overload_2(self, client: Together) -> None:
191191
"role": "system",
192192
}
193193
],
194-
model="Qwen/Qwen3.5-9B",
194+
model="model",
195195
stream=True,
196196
)
197197

@@ -208,7 +208,7 @@ def test_streaming_response_create_overload_2(self, client: Together) -> None:
208208
"role": "system",
209209
}
210210
],
211-
model="Qwen/Qwen3.5-9B",
211+
model="model",
212212
stream=True,
213213
) as response:
214214
assert not response.is_closed
@@ -234,7 +234,7 @@ async def test_method_create_overload_1(self, async_client: AsyncTogether) -> No
234234
"role": "system",
235235
}
236236
],
237-
model="Qwen/Qwen3.5-9B",
237+
model="model",
238238
)
239239
assert_matches_type(ChatCompletion, completion, path=["response"])
240240

@@ -248,7 +248,7 @@ async def test_method_create_with_all_params_overload_1(self, async_client: Asyn
248248
"name": "name",
249249
}
250250
],
251-
model="Qwen/Qwen3.5-9B",
251+
model="model",
252252
chat_template_kwargs={},
253253
compliance="hipaa",
254254
context_length_exceeded_behavior="truncate",
@@ -298,7 +298,7 @@ async def test_raw_response_create_overload_1(self, async_client: AsyncTogether)
298298
"role": "system",
299299
}
300300
],
301-
model="Qwen/Qwen3.5-9B",
301+
model="model",
302302
)
303303

304304
assert response.is_closed is True
@@ -315,7 +315,7 @@ async def test_streaming_response_create_overload_1(self, async_client: AsyncTog
315315
"role": "system",
316316
}
317317
],
318-
model="Qwen/Qwen3.5-9B",
318+
model="model",
319319
) as response:
320320
assert not response.is_closed
321321
assert response.http_request.headers.get("X-Stainless-Lang") == "python"
@@ -334,7 +334,7 @@ async def test_method_create_overload_2(self, async_client: AsyncTogether) -> No
334334
"role": "system",
335335
}
336336
],
337-
model="Qwen/Qwen3.5-9B",
337+
model="model",
338338
stream=True,
339339
)
340340
await completion_stream.response.aclose()
@@ -349,7 +349,7 @@ async def test_method_create_with_all_params_overload_2(self, async_client: Asyn
349349
"name": "name",
350350
}
351351
],
352-
model="Qwen/Qwen3.5-9B",
352+
model="model",
353353
stream=True,
354354
chat_template_kwargs={},
355355
compliance="hipaa",
@@ -399,7 +399,7 @@ async def test_raw_response_create_overload_2(self, async_client: AsyncTogether)
399399
"role": "system",
400400
}
401401
],
402-
model="Qwen/Qwen3.5-9B",
402+
model="model",
403403
stream=True,
404404
)
405405

@@ -416,7 +416,7 @@ async def test_streaming_response_create_overload_2(self, async_client: AsyncTog
416416
"role": "system",
417417
}
418418
],
419-
model="Qwen/Qwen3.5-9B",
419+
model="model",
420420
stream=True,
421421
) as response:
422422
assert not response.is_closed

0 commit comments

Comments (0)