diff --git a/.gitattributes b/.gitattributes index 0da9ba1342f8fc74f2b8f872a3d9d53c588b7343..718b7f93c5ef2950db6379fadeb28789a3c7e4c2 100644 --- a/.gitattributes +++ b/.gitattributes @@ -56,3 +56,84 @@ gen_outputs/Qwen2.5-3B/aime25_t0.6_p0.95_n1280-MNT3072.jsonl filter=lfs diff=lfs gen_outputs/Qwen2.5-3B/math-500_t0.6_p0.95_n192-MNT3072.jsonl filter=lfs diff=lfs merge=lfs -text gen_outputs/Qwen2.5-3B/minerva_t0.6_p0.95_n192-MNT3072.jsonl filter=lfs diff=lfs merge=lfs -text gen_outputs/Qwen2.5-3B/olympiad-bench_t0.6_p0.95_n192-MNT3072.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/base/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/base/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/base/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/base/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/base/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz512_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text +gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/gen_outputs/Qwen2.5-3B-Instruct/base/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/base/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0b4f5b187c4c666d9fa4cf3600aadd6ba72b0713 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/base/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d35c3c762db184d895af82703a2f928d72c94750409cf7813601ae53cc9b62fb +size 140095953 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/base/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/base/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ac302e2d8d6f8b270841724187ee629225748466 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/base/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402832720f23d42e2a86c7b9163933c02752801e04b35461e46133ef28455b8e +size 129001016 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/base/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/base/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dfd93509482a43b5d89b7b792a78cb6c5bbb2cd3 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/base/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63e4d56b8e81337b8c5183760106cdbc31c1cf5908d0cab73531483ace5e5ea2 +size 199414606 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/base/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/base/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..26e64f4ff2eaff8dae6823c3e318f5067f263862 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/base/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe11c31d008ee9b276f6052372bdc626d16a701cdf1947ad80c85b98f14d222 +size 130590718 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/base/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/base/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5b8e22d3f566527f9f1b636382d5fb18a1ed96ef --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/base/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c22297d6cd10afa836a0f8ed7f985a1150a0ff624a545f3ad08d1520da8310a +size 385972880 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f8df63f97e99440f6c5219bdef66d059478b8d32 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97342a310dbc630125f56df35c06c239961b66666196e795402a10ca58c62630 +size 111249166 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ca5e2d49fbec28da936110191fa5e879de1371d9 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff4f38e18be4f5aefc9978a18270488d2daf4ebc333c0ddde7727f7a11902b00 +size 107066903 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cbc91c3cf66c96c53d801100257c8c89c101153f --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd019a858a6fda8cc27f3eb10ad89245627f6d46ee60f0bbf1ec01b902b38c14 +size 174664675 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e6caa426c258224df79cf466c09f15efd4a356a7 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96e61081775590eeca9e1aa1a326d4444ba8346473af55ee0737dba2bd6ffd2c +size 120278494 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..219710c263d13534b02bc3103c3a291b3eea753a --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz1024_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1da75927a2e704c0b216bb5b912546a927b094f6f531365d6c4a934ac14695e6 +size 319896065 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..09342a63d5859dee764e757015bae9e1a8f0140f --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f79ffba89b8b029e6ee18e254eada50e9e3b1cefeb8ed00539dd06afa24334b4 +size 124860222 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2b3924e1a8fdc5d4aeff78b2364eaedb9a4b7898 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5664be34738bd3bfea7fe0763a7cd9f64129e02894bd5289b437b6031f3592fd +size 112853914 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a8877af70178636010a62f936dada4bfbf0a8fba --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20f49a6df37331b3958115b861d3b7ee1af3816a240d1ef83e57bffa741e0c78 +size 172807174 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a82edc3cb6e8195b9935cdd5538b549d3a64e941 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f10f34dcedd2f57b53650ba3d4e5585e59de8f198dcb9ad9b38bb6837796b1d0 +size 115562935 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cdd3fb488e17f39e2821ba3fd61837d27cf79a1e --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz128_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6a5125db307ce2ec15b2bd411179a1cbb087069e58429178845977d6475fd7e +size 340772553 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c20a5ee555c3df605a5bce03870b0d414ebf3e11 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c35c64d4eb29cc5e7ea3cb7080e7ed56253159f9c04d7adbd75617aa7eb38d1 +size 132828679 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..25eb73f9ee7a3bfba9cb97baf9eb42984f64a46f --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a94cec5b41d892dda27ad806ff3381ce58ec71912f8b1d533c6b50d981eaec +size 122212942 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a4c9aef14ec13fc29259d8835b774bc9a010d897 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9a3ba438477486e728800259b35467b159cb5a49c28b4aee87c92d302e7a778 +size 198468214 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3381788a02d8db06b186caa0c0076a2cdf73d830 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2256e2888a28b6b1477095cfced533b630d0db62825b8ed016e6b2ba880a69c2 +size 131626762 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cfc4b8896b654112b1ae2c6d55023124e6518d35 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz16_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e245621f2394afdbbd6442d476016eeca531eb6d32fa515818e16bc400c7c4bc +size 373933963 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fb964280de6037383ffe0db21ec90498ad2e59b2 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36e57b01dc8aa0bad8e77d38c0f62bae86d64c022b4c475814a8bb9f81b24bcb +size 142102866 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..91aa35549735ef8cd95de8ed39927a5feeafcc48 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3671db271b0087985bcccdbaba228753d42167b2ccbff3d39602e15f39659f +size 129380094 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1101cf9b4cae46b4eecc8ce83883fb1fdae41376 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df2b8342d91856fc7ff019b81cd491db4461a55c1dc41033414e5d48bb792c4 +size 200262752 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..56eb30a553f1ec51cf6f7a3af489034b45713b2a --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:716edc30b68920c7739b0db787e489a76233dc713078f3434e40f8ab02d6d30e +size 128987061 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8bc8ac1feb2ec2ca2eb1b1cd4888d61cde4c6695 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz2048_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4224d8548eb2e1c1eb70ed6796205f17d0f6b0a28518a2abb9f57a87b80e22d4 +size 393364768 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ad677c503dd5397b234348324a886ab4d046d092 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:862bd47d9562d21df809a44b31ba3abcb3b4488192fa7e8f21fe4e022bfd3c16 +size 145092038 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7046694921c68c791cfa81a23d2f189e7363895d --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecc655e9fe24662635a027a93f8ab89df3d878fc0b4d40bd29563ca435b3f003 +size 130887555 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7a14957edc5c813af2de42d53023ef6897a99b81 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d5d18a73902ba2a6b211f34f7b08203258ce3ac9989e5f27b3c9b5006a8f674 +size 206351473 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..89221709d63b42dc0fa83dd892599f75c1d9fcfd --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c416bc63b14cc214fdf3f98e5245b2127fb3cc87629c26e3e3db6d66cda122 +size 135350080 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c7117c27f512a03d004bb06f70c965f58aedb27f --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz256_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23435a84a93bd4646bd965d9c2f04a72da6af63fc8740e14bbef82ff78f7a81f +size 396198607 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bc22c45d7e540e34a832fe6e3c436e4b95c2e75f --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87d0c57aee92428b658d26a8777c2a3d1b1456be6c48895fad41f5cb767b549 +size 136181509 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a28211a2af0e8ac32df2d1ef2a68ac67a5d9bb71 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:183dd66c25d6314ca95d00b3c3a9898fefc8751885e835b80eb87002052f255b +size 134265955 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..500fb3dff3b572119387860d27b371491254390f --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85dc0d454dfaceff321c4d7516a26bfee21afad9505c6fc106eab9d10d6049a +size 224213247 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d63fbb78cb71d7e66cdd9c333e0ebacdc7e4ed9c --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dd36dc9b9d004e05950bcf00d3e79f6ce9df620a28ef7011c3b326fb93cf784 +size 147719777 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8999777d4dfa8685a9e1c4c3d3621da60e433856 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz32_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55556b4e9cb615bb72f19cc7d8fc54bad6db9ee839652bf3c2b1d1a9e36bf473 +size 395678730 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..529cd825fb7c69ee33b232bbb0b160c9cf92c9c3 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9b489d90ae2babfd2edf1dab4a878eb02897a10e80dcf5445a940e2a53606d6 +size 162793775 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d48ab5ba71ee3203873065ddf7d0747e468dc324 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f3637c3a7a6566f77b7096cd5eca50ae3ed7156ca97587aa38e0499619290a0 +size 152454768 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e7186f075e2cc6da9b2b0dad1b3e72df7fdae5ae --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d1ad24c65e6e5374ab615da6fc166b428f6e486fd33a01230444d5691bc8cfb +size 226631860 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2fdc8607bd639a3233ee4e8185a861cd971cce67 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b043ad953d6da94c812d4ff08fd5d60c49bb178328311f62a95a72fc8aa1bbd +size 147164712 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d6da798ef06d9b83442e77b6a678e6a11fa75261 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz512_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a5f58bdcad2fed654a1ce7cead8d1be9f57078739f2e19d3b567b84e0d9bcd +size 448269684 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e6439c040b9478fe50419396d60f45029056e234 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122a35d076c3f7fcebcc505a2d77f6bcd7edd89ff516eb6a1a690bfa0d3b3367 +size 134215778 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c1fdc86af9d97d11d500c8bcfa80ab2a90ebc053 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7ed5814844e982a13a7916297ee292cafa001233990c9a76c84d053b8897b71 +size 122043193 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..99709e3829812839a257e11a2051779b951508f4 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde0b0cb840ab0c20a207b7b4bca409778d45b3e5889d679607417b17a06a8ee +size 191578630 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..400aa3c0f6be80df1477a11ad3ec3942a78943b8 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2e91e0c9ad64fb249e1a125552991842d1670b8c8ed21668c050d0509d59385 +size 125266066 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f719631c136f94c1b5ab6c504af05fd5d23c4286 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_bsz64_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be4a554c4d66733a952da1529178d3f46233bb52c40bb726e3808849dbed0771 +size 358212527 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..63d6b91c2207b9dc041c87f90d4633d15d81b065 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa02f1adfc9d0699b4af8e09e8ef68a40b9dbdd9a8833446bc22701afddcd28e +size 125615690 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4711156b7b0b222a2bf079f44b29553cbebf8863 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1587fc443627bb5eb623a4e6d1afcf2ffb7b4e99fa943536696c119c58dade11 +size 120214955 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..34bc3be23623ccdbf21a7cd5eed1028f8304839b --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1df8fdc497bf1669db77e78db76881836d33a9d0fbfe159a0d94808623b75d0 +size 193686408 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..86ebf3b638fc0ba64531ce47c8988f05cc280a7c --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fc005d11badcca0fcb6d80d332db43c464f65b30fc0c6787947f064b99bcd28 +size 127202709 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..19b54bb5214a71e23079d2732ccfed7d6af6708a --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbbb8a7cb9dcae2d410e1b94064ac649fdc4e6bc7a719bd44686fe9777b5c7cf +size 350349479 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fb7d656cfb2de77c5f9a2e052bc23335d3c90606 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d3a69659209cf80d8937ae3e75a28e0fffe514a59846e31ac5b0a5ada9cec61 +size 134740817 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..36569cce702048467488cb7072d5ab818dd3d304 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f171c790c19a143725a51e8887e21177b0391ddfb6515e402d335fecfc48ea5 +size 123127717 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8fb7eafafede3cbb93ce8907bf364c60d30c7a59 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:814814c34df22db4ac9b9ab5316c426a7dffb9bb008ca5b334ff6dae90026bc4 +size 190408516 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b35caed331f8403b2360cbd26e7a43540c5aedff --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6cf74abc5ac208bd1bbf0b227ab52a7ffe7b91fccbb61a2b21cdb9896cf8b2b +size 123184030 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4132b378f5a8c3900fad7fe6f5a434c7f81ce697 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_justrl_plus_plus_step512_rmsprop/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7b0581ae6e4e93c024f53faed7747fe534f1a95ed1abbc5fb04d9fde5729d85 +size 369314836 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7c867c3ca6f2bc2d1abe059c4161d54e1ebd02e6 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e3e061e25f339c73e597a7f7f24f842bac70ac90589a8bfbce637d0e4f3a158 +size 140572159 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8ed2e46c8c74c896b130aa6f42c286dd9389c773 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59bc8775a81ac07674c13a016e45893b2fb6ec574b1118c559fce3c70610225f +size 125454512 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2616fa05b9fa78e272622573fb5ba4399da108b3 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3789f4a8583652abbf665a1128814216f5e7d8bc5215e40dbbe20cea3c06177f +size 200419524 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..449d1eb5f4bb76fcd1e832f4ce79310b7d42c327 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26cd5bab57bece5713a328575ccd374546f109fb0bdc5b0b8951afdfc54ec6ce +size 132872016 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6e7449ee67f9e0ed570b775224d781cd6f254850 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz128_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71d811c83a7ac010ad0f639301b28398c430f61f91b45cc5c8264502f2c9161f +size 386875847 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..09ec614fc198cbdf76f353078034075319bb1a34 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de46238be1aa580bc4d637292632f9bd7783630ac01af716f9b58545fc34d7a7 +size 140272838 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..19daf14eccb048c244955af62ab9673c4618c871 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75e1658107f232150a1d7ff3c854378ce55c11e0b8e5512cd975ece655096d6 +size 129034324 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7ccb6d9bdd134c2126aa095baebd29bb9fb1ac6e --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5cb26f974c43f3c498eedeaa6c9dfceeb38934428ff462d31fa83543eaf3e4c +size 200039126 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5d642ec3ca1b972976df6df906bad75e50e00983 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd79ab739224dc1135cab4e6a284950edd5965f52a9edf704e14aa9cf17aa4be +size 129421540 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..83f369c17f4d413e8609b8f732c53b2de1114cdb --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz256_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aff247f9840ac51a4bf9518855e618fdd2e1afa596d05aeab2ab438f2f3d13f +size 384581745 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..94941f89be1a55648aec587c5620428016b95044 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d3686713188eab6968233986cbe049a7fca4499b05bc83ce4f403fc702f367f +size 140448795 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ff664f2d3806bb86846e2cd2a0da09505111874a --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28a7dcc49b837fab21d8a0eefc209e5170981e58ed5b8f866f3b02b6bb37ed05 +size 128140729 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3be2254e3d872c3ffd3fd706d52d3fad840f8522 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4cd347411edc3ec37a2da0918e266d24a241780f9e7b28902b08a22b7e70d0d +size 196283030 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..191e792f644486bd5cf275de19696d0ca8d76300 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5cdff9c4b9b90a8471f6dccd1a083a05b5ff3811fb619686d1acdeecf14fe14 +size 130577677 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6f9a642b78023734ad8a1b6c6a2e4f58db28782d --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz2_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bfe04c624b5e822eedc00a493b77bc3d91a0d7e5980aa414812c90c154f28c4 +size 386839720 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1a2effc8b75cbed818195bb1a2e5a4ff37913261 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9196f566df67b56720d2b60dae1aef481d0e4dda9be0a0c3e0907b2aed6c7136 +size 141410972 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7c489f0cc00a007beb9d627c581927ae6a51c479 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a695da77cbeabcc3e71f430ae0bde2078faeffb562a585066e523b5f6f579c +size 129370441 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a35ebbafab555b1dcb4552f5f74d5d8f43fee607 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58dd47bea063e114645c091240f4b60a165a493eacab27e4ac02ebeb9ac2a74f +size 200602368 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a1f39764f626cc422b1f4b65f34897a216f485a2 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ccf3bdbcf7708f10d28285e428bef1982ac202b0ea25daca6a61317039613de +size 129625734 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..42fb4f2e4a4a109824ca658835f50ffc96a6e50d --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz4_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24adf3662a4124d98f15b9549cab6dfccd57f12ed0b60e6e2b53c75831fffb93 +size 389777899 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz512_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz512_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5b6c988506f7f8cb90990119a8662d68934c1e55 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz512_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebc8fc48422ed726073728a4516f5c8f91d83cce79ce5f4543ac67f25f5169e3 +size 2381942382 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..efa7f67343f5c8c0309905897b3cd782992db02b --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/aime24_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23a39934273b69ef0db94dbee7e29a674856b55bfa385d7370bb97c64004ee7c +size 143895621 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cc0d94a276f3c640d2bb841f55d98773a06d7787 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/aime25_t0.6_p0.95_n1280-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f92593cbf41506740f510a6f566c50b68733154a6314b4ee6176c79da57901e +size 130550932 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..364bdecc5874fae0fd48630b2adaa0ebf0390bdc --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/math-500_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:914bc8df17834cdb2ad5efc8465daf2b5f7721438d0d88d3b15fac94bc625e71 +size 212003665 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ae02eba434c47f1f9f8e9fad483797168344d207 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/minerva_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bb57ebf9627a789d57acb7771d89fde1827fd2a290a4f8c8223844329cddd12 +size 138598131 diff --git a/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dd44ab655905a83d240e0b6247369f4abfaeb329 --- /dev/null +++ b/gen_outputs/Qwen2.5-3B-Instruct/step512/full_polaris_rollout_sz8_step512_adamw/olympiad-bench_t0.6_p0.95_n192-MNT4096.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2b0c367ffe55f87db08870dbb22ee1b2426ea0d598409478d6748855eaba43f +size 398985809