Update README.md
Browse files
README.md
CHANGED
|
@@ -114,9 +114,9 @@ print(output)
|
|
| 114 |
## Citation
|
| 115 |
|
| 116 |
```
|
| 117 |
-
@article{
|
| 118 |
-
title={Unified
|
| 119 |
-
author={Wang, Yibin and Li, Zhimin and Zang, Yuhang and Wang, Chunyu and Lu, Qinglin
|
| 120 |
journal={arXiv preprint arXiv:2505.03318},
|
| 121 |
year={2025}
|
| 122 |
}
|
|
|
|
| 114 |
## Citation
|
| 115 |
|
| 116 |
```
|
| 117 |
+
@article{unifiedreward-think,
|
| 118 |
+
title={Unified multimodal chain-of-thought reward model through reinforcement fine-tuning},
|
| 119 |
+
author={Wang, Yibin and Li, Zhimin and Zang, Yuhang and Wang, Chunyu and Lu, Qinglin and Jin, Cheng and Wang, Jiaqi},
|
| 120 |
journal={arXiv preprint arXiv:2505.03318},
|
| 121 |
year={2025}
|
| 122 |
}
|