Update README.md
Browse files
README.md
CHANGED
|
@@ -173,3 +173,51 @@ with torch.no_grad():
|
|
| 173 |
)
|
| 174 |
|
| 175 |
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 173 |
)
|
| 174 |
|
| 175 |
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
|
| 176 |
+
|
| 177 |
+
## Citations
|
| 178 |
+
|
| 179 |
+
@misc{shao2024deepseekmathpushinglimitsmathematical,
|
| 180 |
+
title={{DeepSeekMath}: Pushing the Limits of Mathematical Reasoning in Open Language Models},
|
| 181 |
+
author={Zhihong Shao and Peiyi Wang and Qihao Zhu and Junxiao Song and Daya Guo and others},
|
| 182 |
+
year={2024},
|
| 183 |
+
eprint={2402.03300},
|
| 184 |
+
archivePrefix={arXiv},
|
| 185 |
+
primaryClass={cs.CL},
|
| 186 |
+
url={https://arxiv.org/abs/2402.03300}
|
| 187 |
+
}
|
| 188 |
+
|
| 189 |
+
@misc{qwen_qwen25_2025,
|
| 190 |
+
title={Qwen2.5 Technical Report},
|
| 191 |
+
author={Qwen and Yang, An and Yang, Baosong and Zhang, Beichen and Hui, Binyuan and others},
|
| 192 |
+
year={2024},
|
| 193 |
+
eprint={2412.15115},
|
| 194 |
+
archivePrefix={arXiv},
|
| 195 |
+
primaryClass={cs.CL},
|
| 196 |
+
url={https://arxiv.org/abs/2412.15115}
|
| 197 |
+
}
|
| 198 |
+
|
| 199 |
+
@misc{eval-harness,
|
| 200 |
+
author={Gao, Leo and Tow, Jonathan and Abbasi, Baber and Biderman, Stella and Black, Sid and others},
|
| 201 |
+
title={A framework for few-shot language model evaluation},
|
| 202 |
+
month=dec,
|
| 203 |
+
year={2023},
|
| 204 |
+
publisher={Zenodo},
|
| 205 |
+
version={v0.4.0},
|
| 206 |
+
doi={10.5281/zenodo.10257521},
|
| 207 |
+
url={https://github.com/EleutherAI/lm-evaluation-harness}
|
| 208 |
+
}
|
| 209 |
+
|
| 210 |
+
@article{allenai:arc,
|
| 211 |
+
author = {Peter Clark and Isaac Cowhey and Oren Etzioni and Tushar Khot and
|
| 212 |
+
Ashish Sabharwal and Carissa Schoenick and Oyvind Tafjord},
|
| 213 |
+
title = {Think you have Solved Question Answering? Try {ARC}, the {AI2 Reasoning Challenge}},
|
| 214 |
+
journal = {arXiv:1803.05457v1},
|
| 215 |
+
year = {2018},
|
| 216 |
+
}
|
| 217 |
+
|
| 218 |
+
@article{cobbe2021gsm8k,
|
| 219 |
+
title={Training Verifiers to Solve Math Word Problems},
|
| 220 |
+
author={Cobbe, Karl and Kosaraju, Vineet and Bavarian, Mohammad and Chen, Mark and Jun, Heewoo and Kaiser, Lukasz and Plappert, Matthias and Tworek, Jerry and Hilton, Jacob and Nakano, Reiichiro and Hesse, Christopher and Schulman, John},
|
| 221 |
+
journal={arXiv preprint arXiv:2110.14168},
|
| 222 |
+
year={2021}
|
| 223 |
+
}
|