Update README.md
Browse files
README.md
CHANGED
|
@@ -133,4 +133,12 @@ If you find our work helpful, feel free to give us a citation.
|
|
| 133 |
journal={arXiv preprint arXiv:2412.06559},
|
| 134 |
year={2024}
|
| 135 |
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 136 |
```
|
|
|
|
| 133 |
journal={arXiv preprint arXiv:2412.06559},
|
| 134 |
year={2024}
|
| 135 |
}
|
| 136 |
+
@article{prmlessons,
|
| 137 |
+
title={The Lessons of Developing Process Reward Models in Mathematical Reasoning},
|
| 138 |
+
author={
|
| 139 |
+
Zhenru Zhang and Chujie Zheng and Yangzhen Wu and Beichen Zhang and Runji Lin and Bowen Yu and Dayiheng Liu and Jingren Zhou and Junyang Lin
|
| 140 |
+
},
|
| 141 |
+
journal={arXiv preprint arXiv:2501.07301},
|
| 142 |
+
year={2025}
|
| 143 |
+
}
|
| 144 |
```
|