Spaces:
Running
Running
# One-liner to train the Chief of Staff locally and refresh the ablation table.
#
# Must be run with bash (relies on BASH_SOURCE and `set -o pipefail`).
#
# Environment overrides:
#   EPISODES  value forwarded to --episodes (default: 600)
#   LR        value forwarded to --lr       (default: 3e-3)
#
# Outputs:
#   training/checkpoints/cos_ckpt0.pt + cos_final.pt
#   training/reward_curves/reward_curve.png
#   training/reward_curves/before_after.json
#   cache/ablation_results.json (now includes trained_cos arm)

# Abort on any failing command, any unset variable, and any failing
# pipeline stage, so a failed training run never reaches the ablation step.
set -euo pipefail

# ROOT is the parent of the directory that holds this script. Working from
# there lets the relative paths below resolve regardless of the caller's cwd.
ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
cd "$ROOT"

# Hyperparameters: take the caller's environment value when set and
# non-empty, otherwise fall back to the defaults.
EPISODES="${EPISODES:-600}"
LR="${LR:-3e-3}"

printf '%s\n' "[run_training] episodes=$EPISODES lr=$LR"
python3 training/train_cos_local.py --episodes "$EPISODES" --lr "$LR" --seed 0

# Runs only if training exited successfully (see `set -e` above).
printf '%s\n' "[run_training] refreshing ablation table (now with trained CoS arm)"
python3 inference.py --ablation

# Final summary of where to look for results.
printf '%s\n' \
  "[run_training] done" \
  " - reward curve: training/reward_curves/reward_curve.png" \
  " - before/after: training/reward_curves/before_after.json" \
  " - ablation: cache/ablation_results.json"