Skip to content

Commit 2ce2bd5

Browse files
committed
run the x64 ci on regular machines
1 parent 432cf43 commit 2ce2bd5

File tree

2 files changed

+39
-15
lines changed

2 files changed

+39
-15
lines changed

.github/workflows/build.yml

Lines changed: 28 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1251,17 +1251,29 @@ jobs:
12511251
# TODO: simplify the following workflows using a matrix
12521252
# TODO: run lighter CI on PRs and the full CI only on master (if needed)
12531253
ggml-ci-x64-cpu-low-perf:
1254-
runs-on: [self-hosted, Linux, X64, CPU, low-perf]
1254+
runs-on: ubuntu-22.04
12551255

12561256
steps:
12571257
- name: Clone
12581258
id: checkout
12591259
uses: actions/checkout@v4
12601260

1261+
- name: ccache
1262+
uses: ggml-org/ccache-action@v1.2.16
1263+
with:
1264+
key: ggml-ci-x64-cpu-low-perf
1265+
evict-old-files: 1d
1266+
1267+
- name: Dependencies
1268+
id: depends
1269+
run: |
1270+
sudo apt-get update
1271+
sudo apt-get install build-essential libcurl4-openssl-dev
1272+
12611273
- name: Test
12621274
id: ggml-ci
12631275
run: |
1264-
bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
1276+
LLAMA_ARG_THREADS=$(nproc) GG_BUILD_LOW_PERF=1 bash ./ci/run.sh ./tmp/results ./tmp/mnt
12651277
12661278
ggml-ci-arm64-cpu-low-perf:
12671279
runs-on: [self-hosted, Linux, ARM64, CPU, low-perf]
@@ -1277,17 +1289,29 @@ jobs:
12771289
bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
12781290
12791291
ggml-ci-x64-cpu-high-perf:
1280-
runs-on: [self-hosted, Linux, X64, CPU, high-perf]
1292+
runs-on: ubuntu-22.04
12811293

12821294
steps:
12831295
- name: Clone
12841296
id: checkout
12851297
uses: actions/checkout@v4
12861298

1299+
- name: ccache
1300+
uses: ggml-org/ccache-action@v1.2.16
1301+
with:
1302+
key: ggml-ci-x64-cpu-high-perf
1303+
evict-old-files: 1d
1304+
1305+
- name: Dependencies
1306+
id: depends
1307+
run: |
1308+
sudo apt-get update
1309+
sudo apt-get install build-essential libcurl4-openssl-dev
1310+
12871311
- name: Test
12881312
id: ggml-ci
12891313
run: |
1290-
bash ./ci/run.sh ~/results/llama.cpp /mnt/llama.cpp
1314+
LLAMA_ARG_THREADS=$(nproc) bash ./ci/run.sh ./tmp/results ./tmp/mnt
12911315
12921316
ggml-ci-arm64-cpu-high-perf:
12931317
runs-on: [self-hosted, Linux, ARM64, CPU, high-perf]

ci/run.sh

Lines changed: 11 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -339,16 +339,16 @@ function gg_run_qwen3_0_6b {
339339

340340
wiki_test="${path_wiki}/wiki.test.raw"
341341

342-
./bin/llama-quantize ${model_bf16} ${model_q8_0} q8_0
343-
./bin/llama-quantize ${model_bf16} ${model_q4_0} q4_0
344-
./bin/llama-quantize ${model_bf16} ${model_q4_1} q4_1
345-
./bin/llama-quantize ${model_bf16} ${model_q5_0} q5_0
346-
./bin/llama-quantize ${model_bf16} ${model_q5_1} q5_1
347-
./bin/llama-quantize ${model_bf16} ${model_q2_k} q2_k
348-
./bin/llama-quantize ${model_bf16} ${model_q3_k} q3_k
349-
./bin/llama-quantize ${model_bf16} ${model_q4_k} q4_k
350-
./bin/llama-quantize ${model_bf16} ${model_q5_k} q5_k
351-
./bin/llama-quantize ${model_bf16} ${model_q6_k} q6_k
342+
./bin/llama-quantize ${model_bf16} ${model_q8_0} q8_0 $(nproc)
343+
./bin/llama-quantize ${model_bf16} ${model_q4_0} q4_0 $(nproc)
344+
./bin/llama-quantize ${model_bf16} ${model_q4_1} q4_1 $(nproc)
345+
./bin/llama-quantize ${model_bf16} ${model_q5_0} q5_0 $(nproc)
346+
./bin/llama-quantize ${model_bf16} ${model_q5_1} q5_1 $(nproc)
347+
./bin/llama-quantize ${model_bf16} ${model_q2_k} q2_k $(nproc)
348+
./bin/llama-quantize ${model_bf16} ${model_q3_k} q3_k $(nproc)
349+
./bin/llama-quantize ${model_bf16} ${model_q4_k} q4_k $(nproc)
350+
./bin/llama-quantize ${model_bf16} ${model_q5_k} q5_k $(nproc)
351+
./bin/llama-quantize ${model_bf16} ${model_q6_k} q6_k $(nproc)
352352

353353
(time ./bin/llama-cli -no-cnv --model ${model_f16} -ngl 99 -c 1024 -s 1234 -n 64 --ignore-eos -p "I believe the meaning of life is" ) 2>&1 | tee -a $OUT/${ci}-tg-f16.log
354354
(time ./bin/llama-cli -no-cnv --model ${model_bf16} -ngl 99 -c 1024 -s 1234 -n 64 --ignore-eos -p "I believe the meaning of life is" ) 2>&1 | tee -a $OUT/${ci}-tg-bf16.log
@@ -421,7 +421,7 @@ function gg_run_qwen3_0_6b {
421421
function gg_sum_qwen3_0_6b {
422422
gg_printf '### %s\n\n' "${ci}"
423423

424-
gg_printf 'Pythia 2.8B:\n'
424+
gg_printf 'Qwen3 0.6B:\n'
425425
gg_printf '- status: %s\n' "$(cat $OUT/${ci}.exit)"
426426
gg_printf '- perplexity:\n%s\n' "$(cat $OUT/${ci}-ppl.log)"
427427
gg_printf '- imatrix:\n```\n%s\n```\n' "$(cat $OUT/${ci}-imatrix-sum.log)"

0 commit comments

Comments
 (0)