Update README.md
Browse files
README.md
CHANGED
@@ -4,13 +4,13 @@ language:
|
|
4 |
- en
|
5 |
pipeline_tag: text-generation
|
6 |
tags:
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
|
13 |
-
library_name:
|
14 |
---
|
15 |
|
16 |
# An Empirical Study of Mamba-based Language Models
|
@@ -44,4 +44,4 @@ Please cite the paper as follows if you use the models from this repo:
|
|
44 |
year = {2024},
|
45 |
journal = {arXiv preprint arXiv: 2406.07887}
|
46 |
}
|
47 |
-
```
|
|
|
4 |
- en
|
5 |
pipeline_tag: text-generation
|
6 |
tags:
|
7 |
+
- nvidia
|
8 |
+
- Megatron-LM
|
9 |
+
- Mamba
|
10 |
+
- Mamba-2
|
11 |
+
- SSM
|
12 |
+
- 8B
|
13 |
+
library_name: transformers
|
14 |
---
|
15 |
|
16 |
# An Empirical Study of Mamba-based Language Models
|
|
|
44 |
year = {2024},
|
45 |
journal = {arXiv preprint arXiv: 2406.07887}
|
46 |
}
|
47 |
+
```
|