Update README.md
Browse files
README.md
CHANGED
@@ -2,8 +2,6 @@
|
|
2 |
language: ja
|
3 |
thumbnail: https://github.com/rinnakk/japanese-pretrained-models/blob/master/rinna.png
|
4 |
tags:
|
5 |
-
- ja
|
6 |
-
- japanese
|
7 |
- gpt-neox
|
8 |
- text-generation
|
9 |
- lm
|
@@ -63,11 +61,11 @@ Here are a few samples generated with and without the toy prefix weights, respec
|
|
63 |
After version 5.1, [NVIDIA FasterTransformer](https://github.com/NVIDIA/FasterTransformer) now supports both inference for GPT-NeoX and a variety of soft prompts (including prefix-tuning). The released pretrained model and prefix weights in this repo have been verified to work with FasterTransformer 5.1.
|
64 |
|
65 |
# How to cite
|
66 |
-
|
67 |
@misc{rinna-japanese-gpt-neox-small,
|
68 |
title = {rinna/japanese-gpt-neox-small},
|
69 |
-
author = {Zhao, Tianyu and Sawada, Kei}
|
70 |
-
url = {https://huggingface.co/rinna/japanese-gpt-neox-small}
|
71 |
}
|
72 |
|
73 |
@inproceedings{sawada2024release,
|
@@ -76,9 +74,11 @@ After version 5.1, [NVIDIA FasterTransformer](https://github.com/NVIDIA/FasterTr
|
|
76 |
booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
|
77 |
month = {5},
|
78 |
year = {2024},
|
79 |
-
|
|
|
|
|
80 |
}
|
81 |
-
|
82 |
|
83 |
# Licenese
|
84 |
[The MIT license](https://opensource.org/licenses/MIT)
|
|
|
2 |
language: ja
|
3 |
thumbnail: https://github.com/rinnakk/japanese-pretrained-models/blob/master/rinna.png
|
4 |
tags:
|
|
|
|
|
5 |
- gpt-neox
|
6 |
- text-generation
|
7 |
- lm
|
|
|
61 |
After version 5.1, [NVIDIA FasterTransformer](https://github.com/NVIDIA/FasterTransformer) now supports both inference for GPT-NeoX and a variety of soft prompts (including prefix-tuning). The released pretrained model and prefix weights in this repo have been verified to work with FasterTransformer 5.1.
|
62 |
|
63 |
# How to cite
|
64 |
+
```bibtex
|
65 |
@misc{rinna-japanese-gpt-neox-small,
|
66 |
title = {rinna/japanese-gpt-neox-small},
|
67 |
+
author = {Zhao, Tianyu and Sawada, Kei},
|
68 |
+
url = {https://huggingface.co/rinna/japanese-gpt-neox-small}
|
69 |
}
|
70 |
|
71 |
@inproceedings{sawada2024release,
|
|
|
74 |
booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
|
75 |
month = {5},
|
76 |
year = {2024},
|
77 |
+
pages = {13898--13905},
|
78 |
+
url = {https://aclanthology.org/2024.lrec-main.1213},
|
79 |
+
note = {\url{https://arxiv.org/abs/2404.01657}}
|
80 |
}
|
81 |
+
```
|
82 |
|
83 |
# Licenese
|
84 |
[The MIT license](https://opensource.org/licenses/MIT)
|