Spaces:
Running
Running
File size: 897 Bytes
#!/usr/bin/env bash
# One-liner to train the Chief of Staff locally and refresh the ablation table.
# Outputs:
# training/checkpoints/cos_ckpt0.pt + cos_final.pt
# training/reward_curves/reward_curve.png
# training/reward_curves/before_after.json
# cache/ablation_results.json (now includes trained_cos arm)
# Strict mode: abort on any failed command, unset variable, or failed pipeline.
set -euo pipefail

# Work from the directory one level above this script so the relative paths
# used below do not depend on where the caller invoked it from.
ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
cd "$ROOT"

# Hyperparameters: use the caller's environment values when set and non-empty,
# otherwise fall back to the defaults given here.
: "${EPISODES:=600}"
: "${LR:=3e-3}"

# Build each invocation as an argv array so every argument stays one word.
train_cmd=(python3 training/train_cos_local.py --episodes "$EPISODES" --lr "$LR" --seed 0)
ablation_cmd=(python3 inference.py --ablation)

# Step 1: training run (seed is fixed at 0).
printf '%s\n' "[run_training] episodes=$EPISODES lr=$LR"
"${train_cmd[@]}"

# Step 2: re-run the ablation pass after training has finished.
printf '%s\n' "[run_training] refreshing ablation table (now with trained CoS arm)"
"${ablation_cmd[@]}"

# Final summary pointing at the artifact paths.
printf '%s\n' \
  "[run_training] done" \
  " - reward curve: training/reward_curves/reward_curve.png" \
  " - before/after: training/reward_curves/before_after.json" \
  " - ablation: cache/ablation_results.json"
|