Update README.md
Browse files
README.md
CHANGED
@@ -2,8 +2,6 @@
|
|
2 |
language: ja
|
3 |
thumbnail: https://github.com/rinnakk/japanese-pretrained-models/blob/master/rinna.png
|
4 |
tags:
|
5 |
-
- ja
|
6 |
-
- japanese
|
7 |
- gpt
|
8 |
- text-generation
|
9 |
- lm
|
@@ -67,11 +65,11 @@ The model was trained on [Japanese C4](https://huggingface.co/datasets/allenai/c
|
|
67 |
The model uses a [sentencepiece](https://github.com/google/sentencepiece)-based tokenizer. The vocabulary was first trained on a selected subset from the training data using the official sentencepiece training script, and then augmented with emojis and symbols.
|
68 |
|
69 |
# How to cite
|
70 |
-
|
71 |
@misc{rinna-japanese-gpt-1b,
|
72 |
title = {rinna/japanese-gpt-1b},
|
73 |
-
author = {Zhao, Tianyu and Sawada, Kei}
|
74 |
-
url = {https://huggingface.co/rinna/japanese-gpt-1b}
|
75 |
}
|
76 |
|
77 |
@inproceedings{sawada2024release,
|
@@ -80,9 +78,11 @@ The model uses a [sentencepiece](https://github.com/google/sentencepiece)-based
|
|
80 |
booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
|
81 |
month = {5},
|
82 |
year = {2024},
|
83 |
-
|
|
|
|
|
84 |
}
|
85 |
-
|
86 |
|
87 |
# License
|
88 |
[The MIT license](https://opensource.org/licenses/MIT)
|
|
|
2 |
language: ja
|
3 |
thumbnail: https://github.com/rinnakk/japanese-pretrained-models/blob/master/rinna.png
|
4 |
tags:
|
|
|
|
|
5 |
- gpt
|
6 |
- text-generation
|
7 |
- lm
|
|
|
65 |
The model uses a [sentencepiece](https://github.com/google/sentencepiece)-based tokenizer. The vocabulary was first trained on a selected subset from the training data using the official sentencepiece training script, and then augmented with emojis and symbols.
|
66 |
|
67 |
# How to cite
|
68 |
+
```bibtex
|
69 |
@misc{rinna-japanese-gpt-1b,
|
70 |
title = {rinna/japanese-gpt-1b},
|
71 |
+
author = {Zhao, Tianyu and Sawada, Kei},
|
72 |
+
url = {https://huggingface.co/rinna/japanese-gpt-1b}
|
73 |
}
|
74 |
|
75 |
@inproceedings{sawada2024release,
|
|
|
78 |
booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
|
79 |
month = {5},
|
80 |
year = {2024},
|
81 |
+
pages = {13898--13905},
|
82 |
+
url = {https://aclanthology.org/2024.lrec-main.1213},
|
83 |
+
note = {\url{https://arxiv.org/abs/2404.01657}}
|
84 |
}
|
85 |
+
```
|
86 |
|
87 |
# License
|
88 |
[The MIT license](https://opensource.org/licenses/MIT)
|