---
# Model metadata.
# NOTE(review): the keys below look like Hugging Face model-card metadata;
# confirm against the consuming tool's schema before adding new keys.
# Each key must appear exactly once: duplicate mapping keys are invalid YAML
# and most parsers silently keep only the last occurrence.

license: apache-2.0

datasets:
- nvidia/HelpSteer2

language:
- en
- zh

metrics:
- accuracy

base_model:
- sthenno/tempesthenno-14b-nuslerp-0111
- sthenno/tempesthenno-hs2-rm

tags:
- RLHF
- PPO
- custom-research