From 587d4c9934f0bf5ae816c551ff49b3ccba91b6b1 Mon Sep 17 00:00:00 2001 From: Natalie Date: Mon, 4 May 2026 17:51:24 -0400 Subject: [PATCH] =?UTF-8?q?feat(@projects/@magic-civilization):=20?= =?UTF-8?q?=E2=9C=A8=20add=20ai-quality-baseline=20mode?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-Authored-By: Lilith Autocommit --- scripts/apricot-run.sh | 20 ++++++++++++++++++++ 1 file changed, 20 insertions(+) diff --git a/scripts/apricot-run.sh b/scripts/apricot-run.sh index 23e45c21..872fcd76 100755 --- a/scripts/apricot-run.sh +++ b/scripts/apricot-run.sh @@ -62,6 +62,7 @@ case "${MODE}" in difficulty-asym) _seed_count_peek="${3:-10}" ;; # $1 p0 tier, $2 p1 tier, $3 seeds matchup-grid) _seed_count_peek="${1:-5}" ;; # $1 is seeds_per_pair (default 5); total=10pairs*seeds huge-map-5clan) _seed_count_peek="${1:-5}" ;; # $1 is seeds + ai-quality-baseline*) _seed_count_peek="${1:-50}" ;; # $1 seeds-per-tier *) _seed_count_peek="${1:-10}" ;; # smoke, gpu-walltime esac @@ -285,6 +286,25 @@ case "${MODE}" in HUGE_OUTPUT='${REMOTE_HUGE}' \ bash tools/huge-map-5clan.sh 2>&1 | tail -40" ;; + ai-quality-baseline|ai-quality-baseline-pre-c|ai-quality-baseline-post-c) + # p0-20 Phase C — empirical AI-quality baseline. + # Runs `difficulty normal` + `difficulty hard` back-to-back so + # pre-C / post-C comparison covers SEEDS×2 games per build with one + # build+worktree setup. Trailing `TIER1 TIER2` are optional and + # default to `normal hard`. 
+ SEEDS="${1:-50}"; TURNS="${2:-300}" + TIER1="${3:-normal}"; TIER2="${4:-hard}" + GPU_ENV="AI_GPU_ROLLOUT=${AI_GPU_ROLLOUT:-false}" + echo "[$(date +%H:%M:%S)] ai-quality-baseline (${MODE}): ${SEEDS} seeds × ${TIER1}+${TIER2}, T${TURNS}, PARALLEL=${PARALLEL}" + for TIER in "${TIER1}" "${TIER2}"; do + echo " --- baseline tier=${TIER} ---" + ssh "${APRICOT}" "set -euo pipefail; cd '${SCRATCH_ABS}' && \ + AI_USE_MCTS=true AI_DIFFICULTY='${TIER}' \ + AI_DIFFICULTY_P0='${TIER}' AI_DIFFICULTY_P1='${TIER}' \ + ${GPU_ENV} PARALLEL=${PARALLEL} \ + bash tools/autoplay-batch.sh ${SEEDS} ${TURNS} ${RESULTS_ABS}/baseline-${TIER} 2>&1 | tail -20" + done + ;; *) echo "ERROR: unknown mode '${MODE}'" >&2 exit 2