Update README.md
Browse files
README.md
CHANGED
@@ -46,7 +46,7 @@ This repository provides a Japanese GPT-NeoX model of 3.6 billion parameters.
|
|
46 |
| 3.6B SFT | https://huggingface.co/rinna/japanese-gpt-neox-3.6b-instruction-sft |
|
47 |
| 3.6B pretrained | https://huggingface.co/rinna/japanese-gpt-neox-3.6b |
|
48 |
|
49 |
-
* **
|
50 |
|
51 |
[Tianyu Zhao](https://huggingface.co/tianyuz) and [Kei Sawada](https://huggingface.co/keisawada)
|
52 |
|
@@ -109,5 +109,23 @@ The model uses a [sentencepiece](https://github.com/google/sentencepiece)-based
|
|
109 |
# 'გამარ[UNK]ობა 吾輩は 猫である </s>'
|
110 |
~~~
|
111 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
112 |
# License
|
113 |
[The MIT license](https://opensource.org/licenses/MIT)
|
|
|
46 |
| 3.6B SFT | https://huggingface.co/rinna/japanese-gpt-neox-3.6b-instruction-sft |
|
47 |
| 3.6B pretrained | https://huggingface.co/rinna/japanese-gpt-neox-3.6b |
|
48 |
|
49 |
+
* **Contributors**
|
50 |
|
51 |
[Tianyu Zhao](https://huggingface.co/tianyuz) and [Kei Sawada](https://huggingface.co/keisawada)
|
52 |
|
|
|
109 |
# 'გამარ[UNK]ობა 吾輩は 猫である </s>'
|
110 |
~~~
|
111 |
|
112 |
+
# How to cite
|
113 |
+
~~~
|
114 |
+
@misc{rinna-japanese-gpt-neox-3.6b,
|
115 |
+
title = {rinna/japanese-gpt-neox-3.6b},
|
116 |
+
author = {Zhao, Tianyu and Sawada, Kei},
|
117 |
+
url = {https://huggingface.co/rinna/japanese-gpt-neox-3.6b},
|
118 |
+
}
|
119 |
+
|
120 |
+
@inproceedings{sawada2024release,
|
121 |
+
title = {Release of Pre-Trained Models for the {J}apanese Language},
|
122 |
+
author = {Sawada, Kei and Zhao, Tianyu and Shing, Makoto and Mitsui, Kentaro and Kaga, Akio and Hono, Yukiya and Wakatsuki, Toshiaki and Mitsuda, Koh},
|
123 |
+
booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
|
124 |
+
month = {5},
|
125 |
+
year = {2024},
|
126 |
+
url = {https://arxiv.org/abs/2404.01657},
|
127 |
+
}
|
128 |
+
~~~
|
129 |
+
|
130 |
# License
|
131 |
[The MIT license](https://opensource.org/licenses/MIT)
|