Update README.md
Browse files
README.md
CHANGED
@@ -112,9 +112,9 @@ print(text_outputs[0])
|
|
112 |
## Citation
|
113 |
|
114 |
```
|
115 |
-
@article{
|
116 |
-
title={Unified
|
117 |
-
author={Wang, Yibin and Li, Zhimin and Zang, Yuhang and Wang, Chunyu and Lu, Qinglin
|
118 |
journal={arXiv preprint arXiv:2505.03318},
|
119 |
year={2025}
|
120 |
}
|
|
|
112 |
## Citation
|
113 |
|
114 |
```
|
115 |
+
@article{unifiedreward-think,
|
116 |
+
title={Unified multimodal chain-of-thought reward model through reinforcement fine-tuning},
|
117 |
+
author={Wang, Yibin and Li, Zhimin and Zang, Yuhang and Wang, Chunyu and Lu, Qinglin and Jin, Cheng and Wang, Jiaqi},
|
118 |
journal={arXiv preprint arXiv:2505.03318},
|
119 |
year={2025}
|
120 |
}
|