5757jobs :
5858 determine-tag :
5959 name : Determine tag name
60- runs-on : ubuntu-slim
60+ runs-on : [self-hosted, fast]
6161 outputs :
6262 tag_name : ${{ steps.tag.outputs.name }}
6363 steps :
8686 HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
8787 run : |
8888 nvidia-smi
89- GG_BUILD_CUDA=1 bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
89+ GG_BUILD_CUDA=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
9090
9191 ggml-ci-nvidia-vulkan-cm :
9292 needs : determine-tag
@@ -103,7 +103,7 @@ jobs:
103103 HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
104104 run : |
105105 vulkaninfo --summary
106- GG_BUILD_VULKAN=1 GGML_VK_DISABLE_COOPMAT2=1 bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
106+ GG_BUILD_VULKAN=1 GGML_VK_DISABLE_COOPMAT2=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
107107
108108 ggml-ci-nvidia-vulkan-cm2 :
109109 needs : determine-tag
@@ -120,10 +120,11 @@ jobs:
120120 HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
121121 run : |
122122 vulkaninfo --summary
123- GG_BUILD_VULKAN=1 bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
123+ GG_BUILD_VULKAN=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
124124
125125 ggml-ci-nvidia-webgpu :
126- runs-on : [self-hosted, Linux, NVIDIA]
126+ needs : determine-tag
127+ runs-on : [self-hosted, Linux, NVIDIA, X64]
127128
128129 steps :
129130 - name : Clone
@@ -149,10 +150,11 @@ jobs:
149150 GG_BUILD_WEBGPU=1 \
150151 GG_BUILD_WEBGPU_DAWN_PREFIX="$GITHUB_WORKSPACE/dawn" \
151152 GG_BUILD_WEBGPU_DAWN_DIR="$GITHUB_WORKSPACE/dawn/lib64/cmake/Dawn" \
152- bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
153+ bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
153154
154155 # TODO: provision AMX-compatible machine
155156 # ggml-ci-cpu-amx:
157+ # needs: determine-tag
156158 # runs-on: [self-hosted, Linux, CPU, AMX]
157159
158160 # steps:
@@ -163,10 +165,11 @@ jobs:
163165 # - name: Test
164166 # id: ggml-ci
165167 # run: |
166- # bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
168+ # bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
167169
168170 # TODO: provision AMD GPU machine
169171 # ggml-ci-amd-vulkan:
172+ # needs: determine-tag
170173 # runs-on: [self-hosted, Linux, AMD]
171174
172175 # steps:
@@ -178,10 +181,11 @@ jobs:
178181 # id: ggml-ci
179182 # run: |
180183 # vulkaninfo --summary
181- # GG_BUILD_VULKAN=1 bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
184+ # GG_BUILD_VULKAN=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
182185
183186 # TODO: provision AMD GPU machine
184187 # ggml-ci-amd-rocm:
188+ # needs: determine-tag
185189 # runs-on: [self-hosted, Linux, AMD]
186190
187191 # steps:
@@ -193,7 +197,7 @@ jobs:
193197 # id: ggml-ci
194198 # run: |
195199 # amd-smi static
196- # GG_BUILD_ROCM=1 GG_BUILD_AMDGPU_TARGETS="gfx1101" bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
200+ # GG_BUILD_ROCM=1 GG_BUILD_AMDGPU_TARGETS="gfx1101" bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
197201
198202 ggml-ci-mac-metal :
199203 needs : determine-tag
@@ -337,4 +341,66 @@ jobs:
337341 HF_UI_VERSION : ${{ needs.determine-tag.outputs.tag_name }}
338342 run : |
339343 source ./openvino_toolkit/setupvars.sh
340- GG_BUILD_OPENVINO=1 GGML_OPENVINO_DEVICE=GPU GG_BUILD_LOW_PERF=1 bash ./ci/run.sh ./tmp/results ./tmp/mnt
344+ GG_BUILD_OPENVINO=1 GGML_OPENVINO_DEVICE=GPU GG_BUILD_LOW_PERF=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
345+
346+ ggml-ci-arm64-cpu-low-perf :
347+ needs : determine-tag
348+ runs-on : [self-hosted, Linux, ARM64]
349+
350+ steps :
351+ - name : Clone
352+ id : checkout
353+ uses : actions/checkout@v6
354+
355+ - name : Test
356+ id : ggml-ci
357+ run : |
358+ LLAMA_ARG_THREADS=$(nproc) GG_BUILD_LOW_PERF=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
359+
360+ ggml-ci-arm64-cpu-high-perf :
361+ needs : determine-tag
362+ runs-on : [self-hosted, Linux, ARM64]
363+
364+ steps :
365+ - name : Clone
366+ id : checkout
367+ uses : actions/checkout@v6
368+
369+ - name : Test
370+ id : ggml-ci
371+ run : |
372+ LLAMA_ARG_THREADS=$(nproc) GG_BUILD_HIGH_PERF=1 GG_BUILD_NO_SVE=1 GG_BUILD_NO_BF16=1 GG_BUILD_EXTRA_TESTS_0=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
373+
374+ # TODO: not sure how to detect ARM flags on DGX Spark. currently get this error during cmake:
375+ # CMake Warning at ggml/src/ggml-cpu/CMakeLists.txt:147 (message):
376+ # ARM -march/-mcpu not found, -mcpu=native will be used
377+ #
378+ # if we resolve this, we should be able to offload these jobs to the self-hosted runners
379+ #
380+ # ggml-ci-arm64-cpu-high-perf-sve:
381+ # needs: determine-tag
382+ # runs-on: [self-hosted, Linux, NVIDIA, ARM64]
383+ #
384+ # steps:
385+ # - name: Clone
386+ # id: checkout
387+ # uses: actions/checkout@v6
388+ #
389+ # - name: Test
390+ # id: ggml-ci
391+ # run: |
392+ # LLAMA_ARG_THREADS=$(nproc) GG_BUILD_NO_BF16=1 GG_BUILD_EXTRA_TESTS_0=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
393+ #
394+ # ggml-ci-arm64-cpu-kleidiai:
395+ # needs: determine-tag
396+ # runs-on: [self-hosted, Linux, NVIDIA, ARM64]
397+ #
398+ # steps:
399+ # - name: Clone
400+ # id: checkout
401+ # uses: actions/checkout@v6
402+ #
403+ # - name: Test
404+ # id: ggml-ci
405+ # run: |
406+ # GG_BUILD_KLEIDIAI=1 GG_BUILD_EXTRA_TESTS_0=1 bash ./ci/run.sh ~/results/llama.cpp ~/mnt/llama.cpp
0 commit comments