Skip to content

Commit f31bcc1

Browse files
authored
feat: add Azure OpenAI inference provider support (#3396)
# What does this PR do? Llama-stack now supports a new OpenAI compatible endpoint with Azure OpenAI. The starter distro has been updated to add the new remote inference provider. A few tests have been modified and improved. ## Test Plan Deploy a model in the Azure portal then: ``` $ AZURE_API_KEY=... AZURE_API_BASE=... uv run llama stack build --image-type venv --providers inference=remote::azure --run ... $ LLAMA_STACK_CONFIG=http://localhost:8321 uv run --group test pytest -v -ra --text-model azure/gpt-4.1 tests/integration/inference/test_openai_completion.py ... Results: ``` ============================================= test session starts ============================================== platform darwin -- Python 3.12.8, pytest-8.4.1, pluggy-1.6.0 -- /Users/leseb/Documents/AI/llama-stack/.venv/bin/python3 cachedir: .pytest_cache metadata: {'Python': '3.12.8', 'Platform': 'macOS-15.6.1-arm64-arm-64bit', 'Packages': {'pytest': '8.4.1', 'pluggy': '1.6.0'}, 'Plugins': {'anyio': '4.9.0', 'html': '4.1.1', 'socket': '0.7.0', 'asyncio': '1.1.0', 'json-report': '1.5.0', 'timeout': '2.4.0', 'metadata': '3.1.1', 'cov': '6.2.1', 'nbval': '0.11.0', 'hydra-core': '1.3.2'}} rootdir: /Users/leseb/Documents/AI/llama-stack configfile: pyproject.toml plugins: anyio-4.9.0, html-4.1.1, socket-0.7.0, asyncio-1.1.0, json-report-1.5.0, timeout-2.4.0, metadata-3.1.1, cov-6.2.1, nbval-0.11.0, hydra-core-1.3.2 asyncio: mode=Mode.AUTO, asyncio_default_fixture_loop_scope=None, asyncio_default_test_loop_scope=function collected 27 items tests/integration/inference/test_openai_completion.py::test_openai_completion_non_streaming[txt=azure/gpt-5-mini-inference:completion:sanity] SKIPPED [ 3%] tests/integration/inference/test_openai_completion.py::test_openai_completion_non_streaming_suffix[txt=azure/gpt-5-mini-inference:completion:suffix] SKIPPED [ 7%] tests/integration/inference/test_openai_completion.py::test_openai_completion_streaming[txt=azure/gpt-5-mini-inference:completion:sanity] SKIPPED [ 
11%] tests/integration/inference/test_openai_completion.py::test_openai_completion_prompt_logprobs[txt=azure/gpt-5-mini-1] SKIPPED [ 14%] tests/integration/inference/test_openai_completion.py::test_openai_completion_guided_choice[txt=azure/gpt-5-mini] SKIPPED [ 18%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:non_streaming_01] PASSED [ 22%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:streaming_01] PASSED [ 25%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:streaming_01] PASSED [ 29%] tests/integration/inference/test_openai_completion.py::test_inference_store[openai_client-txt=azure/gpt-5-mini-True] PASSED [ 33%] tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=azure/gpt-5-mini-True] PASSED [ 37%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming_with_file[txt=azure/gpt-5-mini] SKIPPED 
[ 40%] tests/integration/inference/test_openai_completion.py::test_openai_completion_prompt_logprobs[txt=azure/gpt-5-mini-0] SKIPPED [ 44%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:non_streaming_02] PASSED [ 48%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:streaming_02] PASSED [ 51%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:streaming_02] PASSED [ 55%] tests/integration/inference/test_openai_completion.py::test_inference_store[openai_client-txt=azure/gpt-5-mini-False] PASSED [ 59%] tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=azure/gpt-5-mini-False] PASSED [ 62%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:non_streaming_01] PASSED [ 66%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:streaming_01] PASSED [ 70%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:streaming_01] PASSED [ 74%] tests/integration/inference/test_openai_completion.py::test_inference_store[client_with_models-txt=azure/gpt-5-mini-True] PASSED [ 77%] tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=azure/gpt-5-mini-True] PASSED [ 81%] 
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:non_streaming_02] PASSED [ 85%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:streaming_02] PASSED [ 88%] tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:streaming_02] PASSED [ 92%] tests/integration/inference/test_openai_completion.py::test_inference_store[client_with_models-txt=azure/gpt-5-mini-False] PASSED [ 96%] tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=azure/gpt-5-mini-False] PASSED [100%] =========================================== short test summary info ============================================ SKIPPED [3] tests/integration/inference/test_openai_completion.py:63: Model azure/gpt-5-mini hosted by remote::azure doesn't support OpenAI completions. SKIPPED [3] tests/integration/inference/test_openai_completion.py:118: Model azure/gpt-5-mini hosted by remote::azure doesn't support vllm extra_body parameters. SKIPPED [1] tests/integration/inference/test_openai_completion.py:124: Model azure/gpt-5-mini hosted by remote::azure doesn't support chat completion calls with base64 encoded files. ================================== 20 passed, 7 skipped, 2 warnings in 51.77s ================================== ``` Signed-off-by: Sébastien Han <[email protected]>
1 parent c2d281e commit f31bcc1

File tree

26 files changed

+6403
-13
lines changed

26 files changed

+6403
-13
lines changed

docs/source/providers/inference/index.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,7 @@ This section contains documentation for all available providers for the **infere
1818
inline_meta-reference
1919
inline_sentence-transformers
2020
remote_anthropic
21+
remote_azure
2122
remote_bedrock
2223
remote_cerebras
2324
remote_databricks
Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
# remote::azure
2+
3+
## Description
4+
5+
6+
Azure OpenAI inference provider for accessing GPT models and other Azure services.
7+
Provider documentation
8+
https://learn.microsoft.com/en-us/azure/ai-foundry/openai/overview
9+
10+
11+
## Configuration
12+
13+
| Field | Type | Required | Default | Description |
14+
|-------|------|----------|---------|-------------|
15+
| `api_key` | `<class 'pydantic.types.SecretStr'>` | No | | Azure API key for Azure |
16+
| `api_base` | `<class 'pydantic.networks.HttpUrl'>` | No | | Azure API base for Azure (e.g., https://your-resource-name.openai.azure.com) |
17+
| `api_version` | `str \| None` | No | | Azure API version for Azure (e.g., 2024-12-01-preview) |
18+
| `api_type` | `str \| None` | No | azure | Azure API type for Azure (e.g., azure) |
19+
20+
## Sample Configuration
21+
22+
```yaml
23+
api_key: ${env.AZURE_API_KEY:=}
24+
api_base: ${env.AZURE_API_BASE:=}
25+
api_version: ${env.AZURE_API_VERSION:=}
26+
api_type: ${env.AZURE_API_TYPE:=}
27+
28+
```
29+

llama_stack/distributions/ci-tests/build.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,7 @@ distribution_spec:
1717
- provider_type: remote::vertexai
1818
- provider_type: remote::groq
1919
- provider_type: remote::sambanova
20+
- provider_type: remote::azure
2021
- provider_type: inline::sentence-transformers
2122
vector_io:
2223
- provider_type: inline::faiss

llama_stack/distributions/ci-tests/run.yaml

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -81,6 +81,13 @@ providers:
8181
config:
8282
url: https://api.sambanova.ai/v1
8383
api_key: ${env.SAMBANOVA_API_KEY:=}
84+
- provider_id: ${env.AZURE_API_KEY:+azure}
85+
provider_type: remote::azure
86+
config:
87+
api_key: ${env.AZURE_API_KEY:=}
88+
api_base: ${env.AZURE_API_BASE:=}
89+
api_version: ${env.AZURE_API_VERSION:=}
90+
api_type: ${env.AZURE_API_TYPE:=}
8491
- provider_id: sentence-transformers
8592
provider_type: inline::sentence-transformers
8693
vector_io:

llama_stack/distributions/starter-gpu/build.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,7 @@ distribution_spec:
1818
- provider_type: remote::vertexai
1919
- provider_type: remote::groq
2020
- provider_type: remote::sambanova
21+
- provider_type: remote::azure
2122
- provider_type: inline::sentence-transformers
2223
vector_io:
2324
- provider_type: inline::faiss

llama_stack/distributions/starter-gpu/run.yaml

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -81,6 +81,13 @@ providers:
8181
config:
8282
url: https://api.sambanova.ai/v1
8383
api_key: ${env.SAMBANOVA_API_KEY:=}
84+
- provider_id: ${env.AZURE_API_KEY:+azure}
85+
provider_type: remote::azure
86+
config:
87+
api_key: ${env.AZURE_API_KEY:=}
88+
api_base: ${env.AZURE_API_BASE:=}
89+
api_version: ${env.AZURE_API_VERSION:=}
90+
api_type: ${env.AZURE_API_TYPE:=}
8491
- provider_id: sentence-transformers
8592
provider_type: inline::sentence-transformers
8693
vector_io:

llama_stack/distributions/starter/build.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,7 @@ distribution_spec:
1818
- provider_type: remote::vertexai
1919
- provider_type: remote::groq
2020
- provider_type: remote::sambanova
21+
- provider_type: remote::azure
2122
- provider_type: inline::sentence-transformers
2223
vector_io:
2324
- provider_type: inline::faiss

llama_stack/distributions/starter/run.yaml

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -81,6 +81,13 @@ providers:
8181
config:
8282
url: https://api.sambanova.ai/v1
8383
api_key: ${env.SAMBANOVA_API_KEY:=}
84+
- provider_id: ${env.AZURE_API_KEY:+azure}
85+
provider_type: remote::azure
86+
config:
87+
api_key: ${env.AZURE_API_KEY:=}
88+
api_base: ${env.AZURE_API_BASE:=}
89+
api_version: ${env.AZURE_API_VERSION:=}
90+
api_type: ${env.AZURE_API_TYPE:=}
8491
- provider_id: sentence-transformers
8592
provider_type: inline::sentence-transformers
8693
vector_io:

llama_stack/distributions/starter/starter.py

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -59,6 +59,7 @@ def _get_config_for_provider(provider_spec: ProviderSpec) -> dict[str, Any]:
5959
"cerebras",
6060
"nvidia",
6161
"bedrock",
62+
"azure",
6263
]
6364

6465
INFERENCE_PROVIDER_IDS = {
@@ -68,6 +69,7 @@ def _get_config_for_provider(provider_spec: ProviderSpec) -> dict[str, Any]:
6869
"cerebras": "${env.CEREBRAS_API_KEY:+cerebras}",
6970
"nvidia": "${env.NVIDIA_API_KEY:+nvidia}",
7071
"vertexai": "${env.VERTEX_AI_PROJECT:+vertexai}",
72+
"azure": "${env.AZURE_API_KEY:+azure}",
7173
}
7274

7375

@@ -277,5 +279,21 @@ def get_distribution_template(name: str = "starter") -> DistributionTemplate:
277279
"http://localhost:11434",
278280
"Ollama URL",
279281
),
282+
"AZURE_API_KEY": (
283+
"",
284+
"Azure API Key",
285+
),
286+
"AZURE_API_BASE": (
287+
"",
288+
"Azure API Base",
289+
),
290+
"AZURE_API_VERSION": (
291+
"",
292+
"Azure API Version",
293+
),
294+
"AZURE_API_TYPE": (
295+
"azure",
296+
"Azure API Type",
297+
),
280298
},
281299
)

llama_stack/providers/registry/inference.py

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -295,4 +295,19 @@ def available_providers() -> list[ProviderSpec]:
295295
description="IBM WatsonX inference provider for accessing AI models on IBM's WatsonX platform.",
296296
),
297297
),
298+
remote_provider_spec(
299+
api=Api.inference,
300+
adapter=AdapterSpec(
301+
adapter_type="azure",
302+
pip_packages=["litellm"],
303+
module="llama_stack.providers.remote.inference.azure",
304+
config_class="llama_stack.providers.remote.inference.azure.AzureConfig",
305+
provider_data_validator="llama_stack.providers.remote.inference.azure.config.AzureProviderDataValidator",
306+
description="""
307+
Azure OpenAI inference provider for accessing GPT models and other Azure services.
308+
Provider documentation
309+
https://learn.microsoft.com/en-us/azure/ai-foundry/openai/overview
310+
""",
311+
),
312+
),
298313
]

0 commit comments

Comments
 (0)