          restore-keys: |
            pip-${{ matrix.os }}-${{ matrix.python-version }}-v1-

+      - name: Run the built image
+        id: run
+        uses: ./.github/actions/docker-daemon-run
+        with:
+          docker-image: lmstudio/llmster-preview:cpu
+          # Use the same port as the always-on API server
+          port: "41343:1234"
+
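+      # If the daemon needs time to come up, a readiness probe could poll the
+      # mapped port before the next step (a sketch only, assuming the container
+      # exposes the OpenAI-compatible /v1/models route on the published port):
+      #   curl --retry 10 --retry-connrefused http://localhost:41343/v1/models
+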
+      - name: Download models for tests (Ubuntu only)
+        if: matrix.os == 'ubuntu-22.04'
+        run: |
+          echo "Downloading required models..."
+
+          # Download text LLMs
+          docker exec llmster lms get https://huggingface.co/hugging-quants/Llama-3.2-1B-Instruct-Q4_K_M-GGUF -y
+          docker exec llmster lms get https://huggingface.co/Qwen/Qwen2.5-7B-Instruct-GGUF -y
+
+          # Download vision LLM
+          docker exec llmster lms get ZiangWu/MobileVLM_V2-1.7B-GGUF -y
+
+          # Download additional model for speculative decoding examples
+          docker exec llmster lms get qwen2.5-0.5b-instruct -y
+
+          echo "Model downloads complete"
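+
+          # A quick sanity check if a download ever silently fails:
+          # `lms ls` lists every model available inside the container.
+          # docker exec llmster lms ls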
+
+      - name: Load models into LM Studio (Ubuntu only)
+        if: matrix.os == 'ubuntu-22.04'
+        run: |
+          echo "Loading models..."
+
+          # Load embedding model
+          docker exec llmster lms load nomic-embed-text-v1.5 --identifier text-embedding-nomic-embed-text-v1.5 -y
+
+          # Load text LLMs
+          docker exec llmster lms load llama-3.2-1b-instruct --identifier llama-3.2-1b-instruct -y
+          docker exec llmster lms load qwen2.5-7b-instruct --identifier qwen2.5-7b-instruct-1m -y
+          docker exec llmster lms load smollm2-135m-instruct --identifier smollm2-135m-instruct -y
+
+          # Load vision LLM
+          docker exec llmster lms load ZiangWu/MobileVLM_V2-1.7B-GGUF --identifier mobilevlm_v2-1.7b -y
+
+          echo "Model loading complete"
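+
+          # Similarly, `lms ps` shows which models are currently loaded, which
+          # helps when debugging identifier mismatches in the tests.
+          # docker exec llmster lms ps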
+
      - name: Install PDM
        run: |
          # Ensure `pdm` uses the same version as specified in `pdm.lock`
@@ -92,11 +136,18 @@ jobs:
          source "$VIRTUAL_ENV_BIN_DIR/activate"
          python -m tox -v -m static

-      - name: CI-compatible tests
+      - name: CI-compatible tests (Windows)
+        if: matrix.os == 'windows-2022'
        run: |
          source "$VIRTUAL_ENV_BIN_DIR/activate"
          python -m tox -v -- -m 'not lmstudio'
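+          # (Arguments after `--` reach pytest via tox's usual {posargs}
+          # passthrough, so this deselects tests marked `lmstudio`, which
+          # need a live server to talk to.)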

+      - name: All tests including LM Studio (Ubuntu)
+        if: matrix.os == 'ubuntu-22.04'
+        run: |
+          source "$VIRTUAL_ENV_BIN_DIR/activate"
+          python -m tox -v
+
      - name: Upload coverage data
        uses: actions/upload-artifact@v4
        with:
@@ -105,6 +156,12 @@ jobs:
          include-hidden-files: true
          if-no-files-found: ignore

+      - name: Stop LM Studio Docker container (Ubuntu only)
+        if: matrix.os == 'ubuntu-22.04' && always()
+        run: |
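+          # `always()` above makes this run even after test failures, and
+          # `|| true` keeps cleanup from failing the job if the container
+          # never started in the first place.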
+          docker stop llmster || true
+          docker rm llmster || true
+
  # Coverage check based on https://hynek.me/articles/ditch-codecov-python/
  coverage:
    name: Combine & check coverage
@@ -143,12 +200,10 @@ jobs:
          # Report again and fail if under 50%.
          # Highest historical coverage: 65%
          # Last noted local test coverage level: 94%
-          # CI coverage percentage is low because many of the tests
-          # aren't CI compatible (they need a local LM Studio instance).
-          # It's only as high as it is because the generated data model
-          # classes make up such a large portion of the total SDK code.
-          # Accept anything over 50% until CI is set up to run LM Studio
-          # in headless mode, and hence is able to run end-to-end tests.
+          # Ubuntu runners now run LM Studio in Docker, so they reach higher
+          # coverage than Windows runners, which still skip the LM Studio
+          # tests. The generated data model classes also account for a large
+          # portion of the SDK code. Accept anything over 50% while the
+          # Windows runners continue to skip the LM Studio tests.
          coverage report --fail-under=50

      - name: Upload HTML report if check failed