# Model-card metadata (Hugging Face Hub style keys).
# Each top-level key is defined exactly once: duplicate mapping keys are
# invalid YAML, and most parsers silently keep only the last occurrence.
license: apache-2.0
datasets:
- HuggingFaceH4/ultrafeedback_binarized
language:
- en
library_name: transformers
# NOTE(review): PPO / HH-RLHF tags suggest a generative model; confirm that
# question-answering is the intended pipeline task.
pipeline_tag: question-answering
tags:
- human feedback
- HH-RLHF
- PPO
# NOTE(review): "lama-1.3B" may be a misspelling of "llama-1.3B"; kept as-is
# until confirmed against the base model name.
- lama-1.3B