Major Features: - Debug counter infrastructure for Refill Stage tracking - Free Pipeline counters (ss_local, ss_remote, tls_sll) - Diagnostic counters for early return analysis - Unified larson.sh benchmark runner with profiles - Phase 6-3 regression analysis documentation Bug Fixes: - Fix SuperSlab disabled by default (HAKMEM_TINY_USE_SUPERSLAB) - Fix profile variable naming consistency - Add .gitignore patterns for large files Performance: - Phase 6-3: 4.79 M ops/s (has OOM risk) - With SuperSlab: 3.13 M ops/s (+19% improvement) This is a clean repository without large log files. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com>
67 lines
1.7 KiB
Bash
67 lines
1.7 KiB
Bash
#!/usr/bin/env bash
|
|
set -euo pipefail
|
|
|
|
# Sweep Ultra params for 16/32/64B: per-class batch and sll cap
|
|
# Usage: scripts/sweep_ultra_params.sh [cycles] [batch]
|
|
|
|
ROOT_DIR=$(cd "$(dirname "$0")/.." && pwd)
|
|
cd "$ROOT_DIR"
|
|
|
|
cycles=${1:-60000}
|
|
batch=${2:-200}
|
|
|
|
make -s bench_fast >/dev/null
|
|
|
|
TS=$(date +%Y%m%d_%H%M%S)
|
|
OUTDIR="bench_results/ultra_param_${TS}"
|
|
mkdir -p "$OUTDIR"
|
|
CSV="$OUTDIR/results.csv"
|
|
echo "size,class,batch_size,sll_cap,bench_batch,cycles,throughput_mops" > "$CSV"
|
|
|
|
size_to_class() {
|
|
case "$1" in
|
|
16) echo 1;;
|
|
32) echo 2;;
|
|
64) echo 3;;
|
|
*) echo -1;;
|
|
esac
|
|
}
|
|
|
|
run_case() {
|
|
local size="$1"; shift
|
|
local ubatch="$1"; shift
|
|
local cap="$1"; shift
|
|
local cls=$(size_to_class "$size")
|
|
local log="$OUTDIR/u_${size}_b=${ubatch}_cap=${cap}.log"
|
|
local BVAR="HAKMEM_TINY_ULTRA_BATCH_C${cls}=${ubatch}"
|
|
local CVAR="HAKMEM_TINY_ULTRA_SLL_CAP_C${cls}=${cap}"
|
|
env HAKMEM_TINY_ULTRA=1 HAKMEM_TINY_ULTRA_VALIDATE=0 HAKMEM_TINY_MAG_CAP=128 \
|
|
"$BVAR" "$CVAR" \
|
|
./bench_tiny_hot_hakmem "$size" "$batch" "$cycles" >"$log" 2>&1 || true
|
|
thr=$(sed -n 's/^Throughput: \([0-9.][0-9.]*\) M ops.*/\1/p' "$log" | tail -n1)
|
|
if [[ -n "$thr" ]]; then
|
|
echo "$size,$cls,$ubatch,$cap,$batch,$cycles,$thr" >> "$CSV"
|
|
fi
|
|
}
|
|
|
|
# Modest sweep ranges for speed
|
|
b16=(64 80 96)
|
|
c16=(256 384)
|
|
b32=(96 112 128)
|
|
c32=(256 384)
|
|
b64=(192 224 256)
|
|
c64=(768 1024)
|
|
|
|
for bb in "${b16[@]}"; do
|
|
for cc in "${c16[@]}"; do run_case 16 "$bb" "$cc"; done
|
|
done
|
|
for bb in "${b32[@]}"; do
|
|
for cc in "${c32[@]}"; do run_case 32 "$bb" "$cc"; done
|
|
done
|
|
for bb in "${b64[@]}"; do
|
|
for cc in "${c64[@]}"; do run_case 64 "$bb" "$cc"; done
|
|
done
|
|
|
|
echo "[done] CSV: $CSV"
|
|
sed -n '1,40p' "$CSV" || true
|