Skip to content

Commit 0381fdf

Browse files
author
sd109
committed
Move test model name out of Tiltfile
1 parent 5ec91ae commit 0381fdf

File tree

1 file changed

+5
-10
lines changed

1 file changed

+5
-10
lines changed

Tiltfile

Lines changed: 5 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,3 @@
1-
# The HuggingFace model to use for testing
2-
# hf_model = "ise-uiuc/Magicoder-S-DS-6.7B" # Good lightweight model for testing
3-
# hf_model = "TheBloke/WizardCoder-Python-34B-V1.0-AWQ" # Poor performance, missing chat_template in repo
4-
hf_model = "TheBloke/SauerkrautLM-70B-v1-AWQ"
5-
# hf_model = "TheBloke/SauerkrautLM-Mixtral-8x7B-Instruct-AWQ" # Works well
6-
# hf_model = "abacusai/Smaug-Mixtral-v0.1" # GPU OOM
7-
# hf_model = "LoneStriker/Smaug-72B-v0.1-AWQ" # Works but produces nonsense responses
8-
91
# Toggles whether UI should be run locally using gradio hot-reloading
102
# or should be included in the remote Helm install
113
run_ui_locally = True
@@ -19,15 +11,18 @@ allow_k8s_contexts('production-llm-service-admin@production-llm-service')
1911

2012
chart_yaml = helm(
2113
"chart/",
22-
values="hu-dev-values.yml",
14+
values="dev-values.yml",
2315
# Enable/disable the remote UI install depending on whether we're running the UI locally
2416
set=[
25-
"huggingface.model={}".format(hf_model),
2617
"ui.enabled={}".format(not str(run_ui_locally).lower())
2718
],
2819
)
2920
k8s_yaml(chart_yaml)
3021

22+
# Parse LLM name from templated deployment
23+
api_deployment, _ = filter_yaml(chart_yaml, kind='Deployment', name='chart-api')
24+
hf_model = decode_yaml(api_deployment)['spec']['template']['spec']['containers'][0]['args'][1]
25+
3126
if not run_ui_locally:
3227
# Port-forward web app to localhost:8080
3328
k8s_resource("chart-ui", port_forwards="8080:7680")

0 commit comments

Comments
 (0)