cleanlab · kelsey-wong · Dec 30, 2025 · Dec 30, 2025
diff --git a/tlm/api.py b/tlm/api.py
@@ -20,7 +20,8 @@ async def inference(
         rag=(context is not None),
         constrain_outputs=config_input.constrain_outputs,
     )
-    config = Config.from_input(config_input, workflow_type)
+    model = openai_args.get("model")
+    config = Config.from_input(config_input, workflow_type, model)
     return await tlm_inference(
         completion_params=openai_args,
         response=response,

diff --git a/tlm/config/base.py b/tlm/config/base.py
@@ -10,6 +10,10 @@
 from tlm.config.provider import ModelProvider
 from tlm.types import SimilarityMeasure
 
+from tlm.config.defaults import get_settings
+
+settings = get_settings()
+
 
 class ReferenceCompletionConfigInput(BaseModel):
     num_reference_completions: int | None = Field(
@@ -109,7 +113,7 @@ class BaseConfig(
 
 class Config(BaseConfig):
     @classmethod
-    def from_input(cls, input: ConfigInput, workflow_type: WorkflowType) -> "Config":
+    def from_input(cls, input: ConfigInput, workflow_type: WorkflowType, model: str | None) -> "Config":
         defaults_for_quality = DEFAULT_CONFIG_FOR_QUALITY[input.quality_preset]
         defaults_for_workflow = DEFAULT_CONFIG_FOR_QUALITY_AND_WORKFLOW[input.quality_preset].get(
             workflow_type
@@ -120,6 +124,7 @@ def from_input(cls, input: ConfigInput, workflow_type: WorkflowType) -> "Config"
         params = {
             "reasoning_effort": reasoning_default,
             "use_prompt_evaluation": workflow_type == WorkflowType.RAG,
+            "model": model or settings.DEFAULT_MODEL,
             **defaults_for_quality,
             **defaults_for_workflow,
             "similarity_measure": SimilarityMeasure.for_workflow(workflow_type),