From c67156597b5301fce93b0e1e8f4f20cf4de2420d Mon Sep 17 00:00:00 2001
From: Progeny Alpha
Date: Sun, 15 Mar 2026 03:18:45 -0400
Subject: [PATCH] vulkan: add n_ubatch sweep to bench script

---
Review notes (this section is ignored when the patch is applied):
Line breaks and leading whitespace were reconstructed (4-space indent
assumed); confirm against scripts/bench-gdn-chunked.sh before applying.
The post-image blob id on the index line predates the edits made to the
sweep loop below and is informational only.

 scripts/bench-gdn-chunked.sh | 29 ++++++++++++++++++++++++++++-
 1 file changed, 28 insertions(+), 1 deletion(-)

diff --git a/scripts/bench-gdn-chunked.sh b/scripts/bench-gdn-chunked.sh
index d41f4f4b3b..ab872e68d3 100755
--- a/scripts/bench-gdn-chunked.sh
+++ b/scripts/bench-gdn-chunked.sh
@@ -71,11 +71,38 @@ if ! RESULT=$($BENCH -m "$MODEL" -ngl 99 -fa 1 -n 128 -p 512,1024,2048 --output
 fi
 
 {
-    echo "## Throughput"
+    echo "## Throughput (default ubatch)"
     echo ""
     echo "$RESULT" | grep -E "^\|"
     echo ""
 } >> "$OUT"
 
+echo "Running n_ubatch sweep (PP-2048)..."
+{
+    echo "## Throughput by n_ubatch (PP-2048)"
+    echo ""
+} >> "$OUT"
+
+# The markdown table header is copied from the first run that yields a
+# pp2048 row, so the table stays well-formed even if ubatch=256 fails.
+UB_HEADER_DONE=0
+for UB in 256 512 1024 2048; do
+    echo "  ubatch=$UB..."
+    # Best effort: a failing size is reported below and the sweep continues.
+    UB_RESULT=$($BENCH -m "$MODEL" -ngl 99 -fa 1 -n 0 -p 2048 -ub "$UB" --output md 2>&1) || true
+    # '|| true' keeps a no-match grep from aborting if pipefail is enabled.
+    UB_LINE=$(echo "$UB_RESULT" | grep "pp2048" | head -1) || true
+    if [ -z "$UB_LINE" ]; then
+        echo "  warning: no pp2048 result for ubatch=$UB, skipping" >&2
+        continue
+    fi
+    if [ "$UB_HEADER_DONE" -eq 0 ]; then
+        echo "$UB_RESULT" | grep -E "^\| (model|---)" | head -2 >> "$OUT"
+        UB_HEADER_DONE=1
+    fi
+    echo "$UB_LINE" >> "$OUT"
+done
+echo "" >> "$OUT"
+
 echo "Running GDN kernel profiling (PP-512)..."
 PROF=$(GGML_VK_PERF_LOGGER=1 GGML_VK_PERF_LOGGER_FREQUENCY=9999 $BENCH -m "$MODEL" -ngl 99 -fa 1 -n 0 -p 512 2>&1 | grep "GATED_DELTA" | head -5)