Update README.md
Browse files
README.md
CHANGED
@@ -55,7 +55,7 @@ This repository provides a Japanese GPT-NeoX model of 3.6 billion parameters. Th
|
|
55 |
| 3.6B SFT | https://huggingface.co/rinna/japanese-gpt-neox-3.6b-instruction-sft |
|
56 |
| 3.6B pretrained | https://huggingface.co/rinna/japanese-gpt-neox-3.6b |
|
57 |
|
58 |
-
* **
|
59 |
|
60 |
[Tianyu Zhao](https://huggingface.co/tianyuz) and [Kei Sawada](https://huggingface.co/keisawada)
|
61 |
|
@@ -168,5 +168,23 @@ The model uses a [sentencepiece](https://github.com/google/sentencepiece)-based
|
|
168 |
# 'გამარ[UNK]ობა 吾輩は 猫である </s>'
|
169 |
~~~
|
170 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
171 |
# License
|
172 |
[The MIT license](https://opensource.org/licenses/MIT)
|
|
|
55 |
| 3.6B SFT | https://huggingface.co/rinna/japanese-gpt-neox-3.6b-instruction-sft |
|
56 |
| 3.6B pretrained | https://huggingface.co/rinna/japanese-gpt-neox-3.6b |
|
57 |
|
58 |
+
* **Contributors**
|
59 |
|
60 |
[Tianyu Zhao](https://huggingface.co/tianyuz) and [Kei Sawada](https://huggingface.co/keisawada)
|
61 |
|
|
|
168 |
# 'გამარ[UNK]ობა 吾輩は 猫である </s>'
|
169 |
~~~
|
170 |
|
171 |
+
# How to cite
|
172 |
+
~~~
|
173 |
+
@misc{rinna-japanese-gpt-neox-3.6b-instruction-ppo,
|
174 |
+
title = {rinna/japanese-gpt-neox-3.6b-instruction-ppo},
|
175 |
+
author = {Zhao, Tianyu and Sawada, Kei},
|
176 |
+
url = {https://huggingface.co/rinna/japanese-gpt-neox-3.6b-instruction-ppo},
|
177 |
+
}
|
178 |
+
|
179 |
+
@inproceedings{sawada2024release,
|
180 |
+
title = {Release of Pre-Trained Models for the {J}apanese Language},
|
181 |
+
author = {Sawada, Kei and Zhao, Tianyu and Shing, Makoto and Mitsui, Kentaro and Kaga, Akio and Hono, Yukiya and Wakatsuki, Toshiaki and Mitsuda, Koh},
|
182 |
+
booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
|
183 |
+
month = {5},
|
184 |
+
year = {2024},
|
185 |
+
url = {https://arxiv.org/abs/2404.01657},
|
186 |
+
}
|
187 |
+
~~~
|
188 |
+
|
189 |
# License
|
190 |
[The MIT license](https://opensource.org/licenses/MIT)
|