stackhpc
diff --git a/‎.github/workflows/build-push-artifacts.yml‎
Lines changed: 2 additions & 1 deletion b/‎.github/workflows/build-push-artifacts.yml‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎.gitignore‎
Lines changed: 2 additions & 2 deletions b/‎.gitignore‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎chart/ci/image-analysis-ui-values.yaml‎
Lines changed: 0 additions & 8 deletions b/‎chart/ci/image-analysis-ui-values.yaml‎
Lines changed: 0 additions & 8 deletions
diff --git a/‎chart/values.schema.json‎
Lines changed: 0 additions & 123 deletions b/‎chart/values.schema.json‎
Lines changed: 0 additions & 123 deletions
diff --git a/‎charts/azimuth-chat/Chart.yaml‎
Lines changed: 22 additions & 0 deletions b/‎charts/azimuth-chat/Chart.yaml‎
Lines changed: 22 additions & 0 deletions
diff --git a/‎charts/azimuth-chat/azimuth-ui.schema.yaml‎
Lines changed: 34 additions & 0 deletions b/‎charts/azimuth-chat/azimuth-ui.schema.yaml‎
Lines changed: 34 additions & 0 deletions
diff --git a/‎charts/azimuth-chat/ci/chat-ui-values.yaml‎
Lines changed: 7 additions & 0 deletions b/‎charts/azimuth-chat/ci/chat-ui-values.yaml‎
Lines changed: 7 additions & 0 deletions
diff --git a/‎charts/azimuth-chat/values.schema.json‎
Lines changed: 128 additions & 0 deletions b/‎charts/azimuth-chat/values.schema.json‎
Lines changed: 128 additions & 0 deletions
diff --git a/‎charts/azimuth-chat/values.yaml‎
Lines changed: 9 additions & 0 deletions b/‎charts/azimuth-chat/values.yaml‎
Lines changed: 9 additions & 0 deletions
diff --git a/‎charts/azimuth-image-analysis/Chart.yaml‎
Lines changed: 22 additions & 0 deletions b/‎charts/azimuth-image-analysis/Chart.yaml‎
Lines changed: 22 additions & 0 deletions
@@ -28,7 +28,7 @@ jobs:
             images:
               - 'web-apps/**'
             chart:
-              - 'chart/**'
+              - 'charts/**'
 
   # Job to build container images
   build_push_images:
@@ -96,6 +96,7 @@ jobs:
       - name: Publish Helm charts
         uses: azimuth-cloud/github-actions/helm-publish@master
         with:
+          directory: charts
           token: ${{ secrets.GITHUB_TOKEN }}
           version: ${{ steps.semver.outputs.version }}
           app-version: ${{ steps.semver.outputs.short-sha }}
@@ -11,8 +11,8 @@ test-values.y[a]ml
 **venv*/
 
 # Helm chart stuff
-chart/Chart.lock
-chart/charts
+charts/*/Chart.lock
+charts/*/charts
 
 # Python stuff
 **/build/
 
@@ -0,0 +1,22 @@
+apiVersion: v2
+name: azimuth-llm-chat
+description: HuggingFace LLM serving along with a simple web chat interface.
+maintainers:
+  - name: "Scott Davidson"
+    email: [email protected]
+
+type: application
+
+version: 0.1.0
+
+appVersion: "0.1.0"
+
+icon: https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg
+
+annotations:
+  azimuth.stackhpc.com/label: HuggingFace LLM Chat  # NOTE(review): presumably the name shown in the Azimuth catalogue - confirm
+
+dependencies:
+  - name: azimuth-llm  # this chart's values for the subchart are nested under the `azimuth-llm` key
+    version: 0.1.0
+    repository: "file://../azimuth-llm/"  # local chart in the sibling directory, not a remote repo
@@ -0,0 +1,34 @@
+controls:
+  /azimuth-llm/huggingface/model:
+    type: TextControl
+    required: true
+  /azimuth-llm/huggingface/token:
+    type: TextControl
+    secret: true
+  # Hidden mirror that mimics the YAML anchor tying model_name to huggingface.model
+  /azimuth-llm/ui/appSettings/model_name:
+    type: MirrorControl
+    path: /azimuth-llm/huggingface/model
+    visuallyHidden: true
+  # Azimuth UI doesn't handle json type ["integer","null"]
+  # properly so we allow any type in JSON schema then
+  # constrain to (optional) integer here.
+  /azimuth-llm/api/modelMaxContextLength:
+    type: IntegerControl
+    minimum: 100
+    step: 100
+    required: false
+
+sortOrder:  # every path here must match a property name in values.schema.json
+  - /azimuth-llm/huggingface/model
+  - /azimuth-llm/huggingface/token
+  - /azimuth-llm/ui/appSettings/model_instruction
+  - /azimuth-llm/ui/appSettings/page_title
+  - /azimuth-llm/api/image/version
+  - /azimuth-llm/ui/appSettings/llm_temperature
+  - /azimuth-llm/ui/appSettings/llm_max_tokens
+  - /azimuth-llm/ui/appSettings/llm_frequency_penalty
+  - /azimuth-llm/ui/appSettings/llm_presence_penalty
+  - /azimuth-llm/ui/appSettings/llm_top_p
+  - /azimuth-llm/ui/appSettings/llm_top_k
+  - /azimuth-llm/api/modelMaxContextLength
@@ -0,0 +1,7 @@
+azimuth-llm:
+  api:
+    enabled: false  # NOTE(review): presumably skips the model backend so CI exercises the UI alone - confirm in azimuth-llm chart
+  ui:
+    service:
+      zenith:
+        enabled: false  # NOTE(review): presumably turns off Zenith exposure of the UI service in CI - confirm
@@ -0,0 +1,128 @@
+{
+    "type": "object",
+    "properties": {
+        "azimuth-llm": {
+            "type": "object",
+            "properties": {
+                "huggingface": {
+                    "type": "object",
+                    "properties": {
+                        "model": {
+                            "type": "string",
+                            "title": "Model",
+                            "description": "The [HuggingFace model](https://huggingface.co/models) to deploy (see [here](https://github.com/stackhpc/azimuth-llm?tab=readme-ov-file#tested-models) for a list of tested models).",
+                            "default": "microsoft/Phi-3.5-mini-instruct"
+                        },
+                        "token": {
+                            "type": [
+                                "string",
+                                "null"
+                            ],
+                            "title": "Access Token",
+                            "description": "A HuggingFace [access token](https://huggingface.co/docs/hub/security-tokens). Required for [gated models](https://huggingface.co/docs/hub/en/models-gated) (e.g. Llama 3)."
+                        }
+                    },
+                    "required": [
+                        "model"
+                    ]
+                },
+                "api": {
+                    "type": "object",
+                    "properties": {
+                        "modelMaxContextLength": {
+                            "title": "Model Context Length",
+                            "description": "An override for the maximum context length to allow, if the model's default is not suitable."
+                        },
+                        "image": {
+                            "type": "object",
+                            "properties": {
+                                "version": {
+                                    "type": "string",
+                                    "title": "Backend vLLM version",
+                                    "description": "The vLLM version to use as a backend. Must be a version tag from [this list](https://github.com/vllm-project/vllm/tags)",
+                                    "default": "v0.6.3"
+                                }
+                            }
+                        }
+                    }
+                },
+                "ui": {
+                    "type": "object",
+                    "properties": {
+                        "appSettings": {
+                            "type": "object",
+                            "properties": {
+                                "model_name": {
+                                    "type": "string",
+                                    "title": "Model Name",
+                                    "description": "Model name supplied to the OpenAI client in frontend web app. Should match huggingface.model above."
+                                },
+                                "model_instruction": {
+                                    "type": "string",
+                                    "title": "Instruction",
+                                    "description": "The initial system prompt (i.e. the hidden instruction) to use when generating responses.",
+                                    "default": "You are a helpful AI assistant. Please respond appropriately."
+                                },
+                                "page_title": {
+                                    "type": "string",
+                                    "title": "Page Title",
+                                    "description": "The title to display at the top of the chat interface.",
+                                    "default": "Large Language Model"
+                                },
+                                "llm_max_tokens": {
+                                    "type": "integer",
+                                    "title": "Max Tokens",
+                                    "description": "The maximum number of new [tokens](https://platform.openai.com/docs/api-reference/chat/create#chat-create-max_tokens) to generate for each LLM response.",
+                                    "default": 1000
+                                },
+                                "llm_temperature": {
+                                    "type": "number",
+                                    "title": "LLM Temperature",
+                                    "description": "The [temperature](https://platform.openai.com/docs/api-reference/chat/create#chat-create-temperature) value to use when generating LLM responses.",
+                                    "default": 0,
+                                    "minimum": 0,
+                                    "maximum": 2
+                                },
+                                "llm_top_p": {
+                                    "type": "number",
+                                    "title": "LLM Top P",
+                                    "description": "The [top p](https://platform.openai.com/docs/api-reference/chat/create#chat-create-top_p) value to use when generating LLM responses.",
+                                    "default": 1,
+                                    "exclusiveMinimum": 0,
+                                    "maximum": 1
+                                },
+                                "llm_top_k": {
+                                    "type": "integer",
+                                    "title": "LLM Top K",
+                                    "description": "The [top k](https://docs.vllm.ai/en/stable/dev/sampling_params.html) value to use when generating LLM responses (must be an integer).",
+                                    "default": -1,
+                                    "minimum": -1
+                                },
+                                "llm_presence_penalty": {
+                                    "type": "number",
+                                    "title": "LLM Presence Penalty",
+                                    "description": "The [presence penalty](https://platform.openai.com/docs/api-reference/chat/create#chat-create-presence_penalty) to use when generating LLM responses.",
+                                    "default": 0,
+                                    "minimum": -2,
+                                    "maximum": 2
+                                },
+                                "llm_frequency_penalty": {
+                                    "type": "number",
+                                    "title": "LLM Frequency Penalty",
+                                    "description": "The [frequency_penalty](https://platform.openai.com/docs/api-reference/chat/create#chat-create-frequency_penalty) to use when generating LLM responses.",
+                                    "default": 0,
+                                    "minimum": -2,
+                                    "maximum": 2
+                                }
+                            },
+                            "required": [
+                                "model_name",
+                                "model_instruction"
+                            ]
+                        }
+                    }
+                }
+            }
+        }
+    }
+}
@@ -0,0 +1,9 @@
+azimuth-llm:  # overrides for the azimuth-llm subchart declared in Chart.yaml
+  huggingface:
+    model: &model-name microsoft/Phi-3.5-mini-instruct  # anchored so the UI's model_name below reuses the same value
+  ui:
+    image:
+      repository: ghcr.io/stackhpc/azimuth-llm-chat-ui
+    appSettings:
+      model_name: *model-name  # alias of huggingface.model; the schema says the two should match
+      model_instruction: "You are a helpful AI assistant; please respond appropriately."
@@ -0,0 +1,22 @@
+apiVersion: v2
+name: azimuth-llm-image-analysis
+description: HuggingFace vision model serving along with a simple web interface.
+maintainers:
+  - name: "Scott Davidson"
+    email: [email protected]
+
+type: application
+
+version: 0.1.0
+
+appVersion: "0.1.0"
+
+icon: https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg
+
+annotations:
+  azimuth.stackhpc.com/label: HuggingFace Image Analysis  # NOTE(review): presumably the name shown in the Azimuth catalogue - confirm
+
+dependencies:
+  - name: azimuth-llm  # shared base chart, pulled in as a subchart
+    version: 0.1.0
+    repository: "file://../azimuth-llm/"  # local chart in the sibling directory, not a remote repo