# Repository metadata (presumably Hugging Face model-card front matter — confirm
# that the enclosing `---` delimiters exist outside this section).
# Each top-level key must appear exactly once: YAML mappings require unique keys.
license: apache-2.0
datasets:
- nvidia/HelpSteer2
language:
- en
- zh
metrics:
- accuracy
base_model:
- sthenno/tempesthenno-14b-nuslerp-0111
- sthenno/tempesthenno-hs2-rm
tags:
- RLHF
- PPO
- custom-research