Skip to content

Commit

Permalink
Merge pull request #1 from stackhpc/feature/pydantic
Browse files Browse the repository at this point in the history
Refactor to use Pydantic-validated config file for frontend web app
  • Loading branch information
sd109 authored Dec 21, 2023
2 parents c9e65c9 + 9dc5974 commit de4324c
Show file tree
Hide file tree
Showing 13 changed files with 172 additions and 191 deletions.
3 changes: 2 additions & 1 deletion .github/workflows/build-push-artifacts.yml
Original file line number Diff line number Diff line change
Expand Up @@ -35,14 +35,15 @@ jobs:
type=sha,prefix=
- name: Build and push image
uses: stackhpc/github-actions/docker-multiarch-build-push@master
uses: stackhpc/github-actions/docker-multiarch-build-push@allow-continue-after-scan
with:
cache-key: ${{ matrix.component }}-base
context: ./images/${{ matrix.component }}-base
platforms: linux/amd64 #,linux/arm64
push: true
tags: ${{ steps.image-meta.outputs.tags }}
labels: ${{ steps.image-meta.outputs.labels }}
fail_on_high_severity_cve: false

build_push_chart:
name: Build and push Helm chart
Expand Down
6 changes: 4 additions & 2 deletions .helmignore
Original file line number Diff line number Diff line change
Expand Up @@ -25,8 +25,10 @@
# Others
README.md
Dockerfile
gradio-app.py
kubeconfig.yml
venv/
__pycache__/
images/
images/
.hf-token.secret
hu-poc/
test-values.yaml
59 changes: 0 additions & 59 deletions app-dev.py

This file was deleted.

2 changes: 1 addition & 1 deletion images/ui-base/Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -3,4 +3,4 @@ FROM python:3.11-slim

ENV GRADIO_SERVER_PORT=7680

RUN pip install --no-cache-dir gradio==3.50.2 huggingface-hub==0.18.0
RUN pip install --no-cache-dir gradio==4.10.0 huggingface-hub==0.19.4 pydantic-settings==2.1.0
4 changes: 3 additions & 1 deletion templates/ui/app-config-map.yml
Original file line number Diff line number Diff line change
Expand Up @@ -5,4 +5,6 @@ metadata:
labels:
{{- include "azimuth-llm.labels" . | nindent 4 }}
data:
{{ (.Files.Glob "web-app-utils/*").AsConfig | nindent 2 }}
{{ (.Files.Glob "web-app/*").AsConfig | nindent 2 }}
settings.yml: |
{{- .Values.ui.appSettings | toYaml | nindent 4 }}
3 changes: 2 additions & 1 deletion templates/ui/deployment.yml
Original file line number Diff line number Diff line change
Expand Up @@ -22,13 +22,14 @@ spec:
ports:
- name: ui
containerPort: 7680
workingDir: /etc/web-app
volumeMounts:
- name: app
mountPath: /etc/web-app
command:
- python
args:
- {{ printf "/etc/web-app/%s" .Values.ui.entrypoint }}
- {{ .Values.ui.entrypoint }}
env:
- name: PYTHONUNBUFFERED
value: "1"
Expand Down
12 changes: 8 additions & 4 deletions values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -29,8 +29,8 @@ huggingface:
api:
# Container image config
image:
repository: ghcr.io/stackhpc/azimuth-llm-api-base
version: "6876068"
repository: vllm/vllm-openai
version: v0.2.4
# Service config
service:
name: llm-backend
Expand Down Expand Up @@ -65,8 +65,12 @@ api:

# Configuration for the frontend web interface
ui:
# The file from the UI config map to execute as the frontend app
entrypoint: example_app_vanilla.py
# The file from the UI config map to execute as the entrypoint to the frontend app
entrypoint: app.py
# The values to be written to settings.yml for parsing as frontend app settings
# (see app.py and config.py for an example of using pydantic-settings to configure the app)
appSettings:
prompt_template: ""
# Container image config
image:
repository: ghcr.io/stackhpc/azimuth-llm-ui-base
Expand Down
58 changes: 0 additions & 58 deletions web-app-utils/example_app_playful.py

This file was deleted.

62 changes: 0 additions & 62 deletions web-app-utils/example_app_vanilla.py

This file was deleted.

Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
import requests, time
from urllib.parse import urljoin


def wait_for_backend(url):
Expand All @@ -7,10 +8,11 @@ def wait_for_backend(url):
accept requests until the backend API is up and running.
"""
ready = False
endpoint = urljoin(url, "/health")
while not ready:
try:
ready = requests.get(f"{url}/health").status_code == 200
print("Waiting for backend API to start")
ready = requests.get(endpoint).status_code == 200
print(f"Waiting for 200 status from backend API at {endpoint}")
time.sleep(1)
except requests.exceptions.ConnectionError as e:
pass
Expand Down
60 changes: 60 additions & 0 deletions web-app/app.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,60 @@
# Entrypoint for the Gradio-based LLM chat frontend.
# Loads Pydantic-validated settings from settings.yml, then blocks until the
# backend API is reachable before constructing the UI.
import requests, json
from urllib.parse import urljoin
import gradio as gr
from api_startup_check import wait_for_backend
from config import AppSettings

# AppSettings is a pydantic-settings model; load() reads ./settings.yml
# (written into the config map by the Helm chart from .Values.ui.appSettings).
settings = AppSettings.load("./settings.yml")

# backend_url is presumably a pydantic URL type — convert to str once so it
# can be passed to requests/urljoin below. TODO confirm against config.py.
backend_url = str(settings.backend_url)
# Block at startup until the backend health endpoint responds, so the UI
# never serves requests against a dead backend.
wait_for_backend(backend_url)


def inference(message, history):
    """Streaming chat handler for gr.ChatInterface.

    Args:
        message: The latest user message.
        history: Gradio chat history as a list of
            (user_input, system_response) pairs.

    Yields:
        The generated text received so far from the backend, with the
        prompt context trimmed off.
    """
    # Rebuild the conversation context from the chat history using the
    # configurable templates from settings.
    context = ""
    for user_input, system_response in history:
        # NOTE(review): both branches below test the same flag
        # (include_past_system_responses_in_context). This first one looks
        # like a copy-paste slip and probably should gate on a separate
        # "include past user inputs" setting — confirm against config.py.
        if settings.include_past_system_responses_in_context:
            context += settings.user_context_template.format(user_input=user_input)
        if settings.include_past_system_responses_in_context:
            context += settings.system_context_template.format(
                system_response=system_response
            )
    # The current message is always appended, regardless of the flags above.
    context += settings.user_context_template.format(user_input=message)

    headers = {"User-Agent": "vLLM Client"}
    # Request body for the backend /generate endpoint; llm_params is merged
    # in last so it can override stream/max_tokens — TODO confirm intended.
    payload = {
        "prompt": settings.prompt_template.format(context=context),
        "stream": True,
        "max_tokens": settings.llm_max_tokens,
        **settings.llm_params,
    }
    response = requests.post(
        urljoin(backend_url, "/generate"), headers=headers, json=payload, stream=True
    )

    # The backend streams NUL-delimited JSON chunks; each chunk carries the
    # full text generated so far in data["text"][0].
    for chunk in response.iter_lines(
        chunk_size=8192, decode_unicode=False, delimiter=b"\0"
    ):
        if chunk:
            data = json.loads(chunk.decode("utf-8"))
            output = data["text"][0]
            # Manually trim the context from output
            # (the last line of the prompt template is used as the marker
            # separating the echoed prompt from the model's reply).
            delimiter = settings.prompt_template.splitlines()[-1]
            if delimiter in output:
                output = output.split(delimiter)[-1]
            yield output


# Build the chat UI around the streaming inference() generator and start the
# Gradio server. server_name="0.0.0.0" binds all interfaces so the app is
# reachable from outside the container (port comes from GRADIO_SERVER_PORT,
# set in the image).
gr.ChatInterface(
    inference,
    chatbot=gr.Chatbot(
        height=500,
        show_copy_button=True,
        # layout='panel',
    ),
    textbox=gr.Textbox(placeholder="Ask me anything...", container=False, scale=7),
    # Page title is configurable via the Pydantic settings file.
    title=settings.page_title,
    retry_btn="Retry",
    undo_btn="Undo",
    clear_btn="Clear",
).queue().launch(server_name="0.0.0.0")
Loading

0 comments on commit de4324c

Please sign in to comment.