File size: 897 Bytes
d02bacd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
#!/usr/bin/env bash
# One-liner to train the Chief of Staff locally and refresh the ablation table.
#
# Environment (all optional):
#   EPISODES  value forwarded to --episodes (default: 600)
#   LR        value forwarded to --lr       (default: 3e-3)
#   SEED      value forwarded to --seed     (default: 0)
#
# Outputs:
#   training/checkpoints/cos_ckpt0.pt + cos_final.pt
#   training/reward_curves/reward_curve.png
#   training/reward_curves/before_after.json
#   cache/ablation_results.json  (now includes trained_cos arm)
set -euo pipefail

# Resolve the repository root as the parent of the directory holding this
# script. CDPATH is cleared and cd's stdout is discarded: with an exported
# CDPATH and a relative invocation path, `cd` echoes the directory it chose,
# which would otherwise be captured into ROOT alongside the `pwd` output.
ROOT="$(CDPATH='' cd -- "$(dirname -- "${BASH_SOURCE[0]}")/.." >/dev/null && pwd)"
cd -- "$ROOT"

# Hyper-parameters: caller-supplied environment values win, else defaults.
EPISODES="${EPISODES:-600}"
LR="${LR:-3e-3}"
SEED="${SEED:-0}"

echo "[run_training] episodes=$EPISODES lr=$LR"
# Under `set -e`, a non-zero exit here aborts before the ablation refresh.
python3 training/train_cos_local.py --episodes "$EPISODES" --lr "$LR" --seed "$SEED"

echo "[run_training] refreshing ablation table (now with trained CoS arm)"
python3 inference.py --ablation

echo "[run_training] done"
echo "  - reward curve: training/reward_curves/reward_curve.png"
echo "  - before/after: training/reward_curves/before_after.json"
echo "  - ablation:     cache/ablation_results.json"