
Commit 9e18a8a

Merge pull request #374 from DefangLabs/linda-use-haiku
Use Haiku on Managed LLM
2 parents: e0d02ad + 677ccc3 · commit 9e18a8a

4 files changed: 4 additions(+), 4 deletions(-)


samples/managed-llm-provider/README.md

Lines changed: 1 addition & 1 deletion
@@ -41,7 +41,7 @@ For this sample, you will need to provide the following [configuration](https://
 > Note that if you are using the 1-click deploy option, you can set these values as secrets in your GitHub repository and the action will automatically deploy them for you.
 
 ### `MODEL`
-The Model ID of the LLM you are using for your application. For example, `anthropic.claude-3-5-sonnet-20241022-v2:0`.
+The Model ID of the LLM you are using for your application. For example, `anthropic.claude-3-haiku-20240307-v1:0`.
 ```bash
 defang config set MODEL
 ```
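
As a side note on how this setting reaches the application: the value stored with `defang config set MODEL` shows up in the service container as the `MODEL` environment variable (see the compose.yaml hunk below). A minimal sketch, not taken from the sample, of reading it at runtime:

```python
# Illustrative sketch, not code from this repo. Assumes the configured value is
# exposed to the container as the MODEL environment variable, as in compose.yaml.
import os

# Fall back to the example ID introduced by this commit if MODEL is not set.
model_id = os.environ.get("MODEL", "anthropic.claude-3-haiku-20240307-v1:0")
print(f"Using model: {model_id}")
```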

samples/managed-llm-provider/compose.yaml

Lines changed: 1 addition & 1 deletion
@@ -8,7 +8,7 @@ services:
     restart: always
     environment:
       - ENDPOINT_URL=http://llm/api/v1/chat/completions # endpoint to the Provider Service
-      - MODEL=anthropic.claude-3-5-sonnet-20241022-v2:0 # LLM model ID used in the Provider Service
+      - MODEL=anthropic.claude-3-haiku-20240307-v1:0 # LLM model ID used in the Provider Service
       - OPENAI_API_KEY=FAKE_TOKEN # the actual value will be ignored when using the Provider Service
     healthcheck:
       test: ["CMD", "python3", "-c", "import sys, urllib.request; urllib.request.urlopen(sys.argv[1]).read()", "http://localhost:8000/"]
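
To show how a service might consume these variables, here is a minimal sketch of one chat completion request against the Provider Service. It is illustrative rather than the sample's actual application code, and it assumes the endpoint speaks the standard OpenAI chat completions JSON format:

```python
# Illustrative sketch, not from the sample: send one chat completion request using
# the ENDPOINT_URL, MODEL, and OPENAI_API_KEY values declared in compose.yaml.
import json
import os
import urllib.request

endpoint = os.environ.get("ENDPOINT_URL", "http://llm/api/v1/chat/completions")
model = os.environ.get("MODEL", "anthropic.claude-3-haiku-20240307-v1:0")
api_key = os.environ.get("OPENAI_API_KEY", "FAKE_TOKEN")  # ignored by the Provider Service

payload = {
    "model": model,
    "messages": [{"role": "user", "content": "Say hello in one short sentence."}],
}

req = urllib.request.Request(
    endpoint,
    data=json.dumps(payload).encode("utf-8"),
    headers={
        "Content-Type": "application/json",
        "Authorization": f"Bearer {api_key}",
    },
    method="POST",
)

with urllib.request.urlopen(req) as resp:
    body = json.load(resp)

# Standard OpenAI-style response shape: first choice's message content.
print(body["choices"][0]["message"]["content"])
```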

samples/managed-llm/README.md

Lines changed: 1 addition & 1 deletion
@@ -42,7 +42,7 @@ For this sample, you will need to provide the following [configuration](https://
 > Note that if you are using the 1-click deploy option, you can set these values as secrets in your GitHub repository and the action will automatically deploy them for you.
 
 ### `MODEL`
-The Model ID of the LLM you are using for your application. For example, `anthropic.claude-3-5-sonnet-20241022-v2:0`.
+The Model ID of the LLM you are using for your application. For example, `anthropic.claude-3-haiku-20240307-v1:0`.
 ```bash
 defang config set MODEL
 ```

samples/managed-llm/compose.yaml

Lines changed: 1 addition & 1 deletion
@@ -8,7 +8,7 @@ services:
     restart: always
     environment:
       - ENDPOINT_URL=http://llm/api/v1/chat/completions # endpoint to the gateway service
-      - MODEL=anthropic.claude-3-5-sonnet-20241022-v2:0 # LLM model ID used for the gateway
+      - MODEL=anthropic.claude-3-haiku-20240307-v1:0 # LLM model ID used for the gateway
       - OPENAI_API_KEY=FAKE_TOKEN # the actual value will be ignored when using the gateway, but it should match the one in the llm service
     healthcheck:
       test: ["CMD", "python3", "-c", "import sys, urllib.request; urllib.request.urlopen(sys.argv[1]).read()", "http://localhost:8000/"]
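
The healthcheck above also works as a manual smoke test. A sketch of the same probe as a standalone script, assuming the app is reachable on localhost:8000 from wherever you run it:

```python
# Illustrative: the same HTTP probe the compose healthcheck performs, as a script.
import sys
import urllib.request

url = sys.argv[1] if len(sys.argv) > 1 else "http://localhost:8000/"
urllib.request.urlopen(url).read()  # raises URLError/HTTPError if the service is unhealthy
print(f"OK: {url} responded")
```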
