Spaces:
Running
Running
natolambert
committed on
Merge branch 'main' of https://huggingface.co/spaces/allenai/reward-bench
Browse files
app.py
CHANGED
@@ -350,7 +350,7 @@ Warning, refusals, XSTest, and donotanswer datasets have sensitive content.""")
|
|
350 |
with gr.Accordion("π Citation", open=False):
|
351 |
citation_button = gr.Textbox(
|
352 |
value=r"""@misc{RewardBench,
|
353 |
-
title={RewardBench:
|
354 |
author={Lambert, Nathan and Pyatkin, Valentina and Morrison, Jacob and Miranda, LJ and Lin, Bill Yuchen and Chandu, Khyathi and Dziri, Nouha and Kumar, Sachin and Zick, Tom and Choi, Yejin and Smith, Noah A. and Hajishirzi, Hannaneh},
|
355 |
year={2024},
|
356 |
howpublished={\url{https://huggingface.co/spaces/allenai/reward-bench}
|
|
|
350 |
with gr.Accordion("π Citation", open=False):
|
351 |
citation_button = gr.Textbox(
|
352 |
value=r"""@misc{RewardBench,
|
353 |
+
title={RewardBench: Evaluating Reward Models},
|
354 |
author={Lambert, Nathan and Pyatkin, Valentina and Morrison, Jacob and Miranda, LJ and Lin, Bill Yuchen and Chandu, Khyathi and Dziri, Nouha and Kumar, Sachin and Zick, Tom and Choi, Yejin and Smith, Noah A. and Hajishirzi, Hannaneh},
|
355 |
year={2024},
|
356 |
howpublished={\url{https://huggingface.co/spaces/allenai/reward-bench}
|
src/md.py
CHANGED
@@ -92,5 +92,5 @@ For more details, see the [dataset](https://huggingface.co/datasets/allenai/rewa
|
|
92 |
TOP_TEXT = """
|
93 |
# RewardBench: Evaluating Reward Models
|
94 |
### Evaluating the capabilities, safety, and pitfalls of reward models
|
95 |
-
[Code](https://github.com/allenai/reward-bench) | [Eval. Dataset](https://huggingface.co/datasets/allenai/reward-bench) | [
|
96 |
"""
|
|
|
92 |
TOP_TEXT = """
|
93 |
# RewardBench: Evaluating Reward Models
|
94 |
### Evaluating the capabilities, safety, and pitfalls of reward models
|
95 |
+
[Code](https://github.com/allenai/reward-bench) | [Eval. Dataset](https://huggingface.co/datasets/allenai/reward-bench) | [Prior Test Sets](https://huggingface.co/datasets/allenai/pref-test-sets) | [Results](https://huggingface.co/datasets/allenai/reward-bench-results) | Paper (coming soon)
|
96 |
"""
|