sthenno's picture
Update README.md
c707d0c verified
|
raw
history blame
216 Bytes
metadata
# Repository metadata block: a flat mapping of descriptive fields.
# NOTE(review): this appears to be README front matter; the enclosing
# `---` delimiters are not visible in this view — confirm they exist.

# License identifier declared for this repository.
license: apache-2.0
# Dataset repositories associated with this entry (owner/name form).
datasets:
  - nvidia/HelpSteer2
# Language codes; presumably English and Chinese — confirm.
language:
  - en
  - zh
# Metric names reported for this entry.
metrics:
  - accuracy
# Repositories this entry is declared to be based on.
# NOTE(review): two bases are listed; the `-rm` suffix on the second
# presumably denotes a reward model — confirm with the author.
base_model:
  - sthenno/tempesthenno-14b-nuslerp-0111
  - sthenno/tempesthenno-hs2-rm
# Free-form labels attached to this entry.
tags:
  - RLHF
  - PPO
  - custom-research