sehyun66's picture
Create README.md
da9c395 verified
|
raw
history blame
204 Bytes
metadata
license: apache-2.0
datasets:
  - HuggingFaceH4/ultrafeedback_binarized
language:
  - en
library_name: transformers
pipeline_tag: question-answering
tags:
  - human feedback
  - HH-RLHF
  - PPO
  - llama-1.3B