Update README.md
Browse files
README.md
CHANGED
@@ -3,6 +3,7 @@ base_model: Sunshine279/gammaPO-llama-3-8b-instruct
 tags:
 - alignment-handbook
 - generated_from_trainer
+- arxiv:2506.03690
 datasets:
 - princeton-nlp/llama3-ultrafeedback-armorm
 model-index: