DopeorNope
committed on
Commit
•
66f4b43
1
Parent(s):
93ecf77
Upload MixtralForCausalLM
Browse files
- config.json +34 -0
- generation_config.json +7 -0
- model-00001-of-00044.safetensors +3 -0
- model-00002-of-00044.safetensors +3 -0
- model-00003-of-00044.safetensors +3 -0
- model-00004-of-00044.safetensors +3 -0
- model-00005-of-00044.safetensors +3 -0
- model-00006-of-00044.safetensors +3 -0
- model-00007-of-00044.safetensors +3 -0
- model-00008-of-00044.safetensors +3 -0
- model-00009-of-00044.safetensors +3 -0
- model-00010-of-00044.safetensors +3 -0
- model-00011-of-00044.safetensors +3 -0
- model-00012-of-00044.safetensors +3 -0
- model-00013-of-00044.safetensors +3 -0
- model-00014-of-00044.safetensors +3 -0
- model-00015-of-00044.safetensors +3 -0
- model-00016-of-00044.safetensors +3 -0
- model-00017-of-00044.safetensors +3 -0
- model-00018-of-00044.safetensors +3 -0
- model-00019-of-00044.safetensors +3 -0
- model-00020-of-00044.safetensors +3 -0
- model-00021-of-00044.safetensors +3 -0
- model-00022-of-00044.safetensors +3 -0
- model-00023-of-00044.safetensors +3 -0
- model-00024-of-00044.safetensors +3 -0
- model-00025-of-00044.safetensors +3 -0
- model-00026-of-00044.safetensors +3 -0
- model-00027-of-00044.safetensors +3 -0
- model-00028-of-00044.safetensors +3 -0
- model-00029-of-00044.safetensors +3 -0
- model-00030-of-00044.safetensors +3 -0
- model-00031-of-00044.safetensors +3 -0
- model-00032-of-00044.safetensors +3 -0
- model-00033-of-00044.safetensors +3 -0
- model-00034-of-00044.safetensors +3 -0
- model-00035-of-00044.safetensors +3 -0
- model-00036-of-00044.safetensors +3 -0
- model-00037-of-00044.safetensors +3 -0
- model-00038-of-00044.safetensors +3 -0
- model-00039-of-00044.safetensors +3 -0
- model-00040-of-00044.safetensors +3 -0
- model-00041-of-00044.safetensors +3 -0
- model-00042-of-00044.safetensors +3 -0
- model-00043-of-00044.safetensors +3 -0
- model-00044-of-00044.safetensors +3 -0
- model.safetensors.index.json +0 -0
config.json
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "solar_moe_3",
|
3 |
+
"architectures": [
|
4 |
+
"MixtralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 4096,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 14336,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "mixtral",
|
16 |
+
"num_attention_heads": 32,
|
17 |
+
"num_experts_per_tok": 2,
|
18 |
+
"num_hidden_layers": 48,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"num_local_experts": 6,
|
21 |
+
"output_router_logits": false,
|
22 |
+
"pad_token_id": 2,
|
23 |
+
"pretraining_tp": 1,
|
24 |
+
"rms_norm_eps": 1e-05,
|
25 |
+
"rope_scaling": null,
|
26 |
+
"rope_theta": 10000.0,
|
27 |
+
"router_aux_loss_coef": 0.001,
|
28 |
+
"sliding_window": null,
|
29 |
+
"tie_word_embeddings": false,
|
30 |
+
"torch_dtype": "float32",
|
31 |
+
"transformers_version": "4.36.0.dev0",
|
32 |
+
"use_cache": true,
|
33 |
+
"vocab_size": 32000
|
34 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"pad_token_id": 2,
|
6 |
+
"transformers_version": "4.36.0.dev0"
|
7 |
+
}
|
model-00001-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a7f97158ab892d5a7421d084aa640dbccb3cc9abb5cbf1b9e71bbb45bd7d28c
|
3 |
+
size 4987161928
|
model-00002-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44ab382e664b5ab0394e474909caea3efcc31f6b9f6e68a860b7b75723f9d4b2
|
3 |
+
size 4966289216
|
model-00003-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83abc8cb8af127c941805668d1c6acc6bfd376ab06bb856a326c471cc0bb4e5a
|
3 |
+
size 4865527152
|
model-00004-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb48931bb6bb729f2863637c734e74a68de504b80a0a295bfcd42e27e7186976
|
3 |
+
size 4865527152
|
model-00005-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:addb639836e642107d53578a4c249b83ad176f80847590f1410ffe1e516cba88
|
3 |
+
size 4865527152
|
model-00006-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:248d7efcb825fe3a5f5cfbfd7800219db19147a20b9a4a4869e7fcce93ffed9a
|
3 |
+
size 4865527152
|
model-00007-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e5759a8f801dac28da29df94418c60ce2daf7bdbd8c6a0e5e9e757e2c487779
|
3 |
+
size 4865527152
|
model-00008-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2382c5cb986082d11e585226cd887964e1ae1f5233063707abee5bbac7adba2d
|
3 |
+
size 4865527152
|
model-00009-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7d15d96b2166e8200ab68af7eac14956a4708bc660743cb516513424bd388f9
|
3 |
+
size 4865527144
|
model-00010-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24bb1f68166bbc9b6ba57948911985ea4dedada9273830ac3e76e3e8035df5ff
|
3 |
+
size 4966223816
|
model-00011-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:531312f78076dc5ca13b6a45de50532bbd615443218d6ec1ed8feeba84e0d452
|
3 |
+
size 4932734584
|
model-00012-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0766bdeb93ebbf89e6c045be89cfd8041f0dd25de323c80e4c4aeb5853c7e374
|
3 |
+
size 4865527176
|
model-00013-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4247dbdc946bd6e74332db403a5dbffac0df5e92a2696636d57d2e016ff3b012
|
3 |
+
size 4865527176
|
model-00014-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:baff952fccd40670c725174d319f9ac142f5ddc62215a0c78932e3fe61c01fbc
|
3 |
+
size 4865527176
|
model-00015-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fa401272e8a2f2656bf2aa5ca093e592bd5c9230628953a3216d4d8e5ac0806
|
3 |
+
size 4865527176
|
model-00016-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01bea421c21b89f90c4451d0db889fc03c629f7f98d32225307188e3d5634d2f
|
3 |
+
size 4865527176
|
model-00017-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2935e2fb733c7b72bc22f6d728f12cb5e991445db80554dc7eaa39f4107f19c5
|
3 |
+
size 4865527176
|
model-00018-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50e329f234b30c0bb2b1259bd33e748f34525b1fe4e943e3c19b461416566c7e
|
3 |
+
size 4865527176
|
model-00019-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46f39c6af9e582a7d9ad676651f3748d810d9d83da02847151b76ecc26275573
|
3 |
+
size 4966223816
|
model-00020-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eefe94fed65bc4be544b5f93698637c55e6317bbb6d6e0e87b75e148ea91234
|
3 |
+
size 4932734584
|
model-00021-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:001e0a8a37fdff52dde88121dec9fcce87102989ed668f0ac4ba34b379afc067
|
3 |
+
size 4865527176
|
model-00022-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8c4b3ce5ae63a1d74d139b9b883f3e41774f691559384d8fbf22fba9341e47d
|
3 |
+
size 4865527176
|
model-00023-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7637b4f77653da5231fe97a50df43c2032ebc7aa0da6a25e64ccc785972065b1
|
3 |
+
size 4865527176
|
model-00024-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71cf12635acecd62c1295b6a1ced27eea72054661aca91e1be04305cf92b23a0
|
3 |
+
size 4865527176
|
model-00025-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32e6ef122acd31d9e9f5f568014dd1e846a37c30f82c628e12c2310e38153bf0
|
3 |
+
size 4865527176
|
model-00026-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abf9ab5b50125f690a13147e1812d4aae464e21ec0cf1d01d9e2f576c418f3b
|
3 |
+
size 4865527176
|
model-00027-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4816f59e12033c2208a96966453cb88f3bf1ba79eb62db4fb356cd5d5c982e6
|
3 |
+
size 4865527176
|
model-00028-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36583a3bccbcef08e6cdbd7095408583985a9e4181b0de4742e45469a9ab0145
|
3 |
+
size 4966223816
|
model-00029-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff23264f229e63b1e3eed9e674d9c4afb73908f06e4b08f4b6880a88feeb22aa
|
3 |
+
size 4932734584
|
model-00030-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c58b983366f1bbba13512a22a5484b23579b1b9b6b26c597a6cc7b4fc6fa224
|
3 |
+
size 4865527176
|
model-00031-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21a6905de5e32cce8e0f847993c361df8de6471b6118145d24689151838c5c04
|
3 |
+
size 4865527176
|
model-00032-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1be33703958014091502ad127202e75a08e79b3e2005986e73f4a39ecf6e2fea
|
3 |
+
size 4865527176
|
model-00033-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:733e0f88850fa1d5b7879668dc3b2e602400cc40ca4998c82d46b3f9f3f0b592
|
3 |
+
size 4865527176
|
model-00034-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dea0f2aaf5a9985a79f4f55977eb31fdafbd07b21c42b071f5c3eacd2a780768
|
3 |
+
size 4865527176
|
model-00035-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c666c53a5fa2287efad4279350e2ba633d168e462bd00b4e4e76ec503aee81db
|
3 |
+
size 4865527176
|
model-00036-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca171c1d92c3dc34d8a15ea488e231e3532cdbaf46d957478cd31a2f895d2483
|
3 |
+
size 4865527176
|
model-00037-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdfadabf288d31a680d4835477bbc0548de3733acc555a22c1537eee5553590c
|
3 |
+
size 4966223816
|
model-00038-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c26a2814743022c163d40248170d819d41f3d798ff6c920964792d6bf35b643
|
3 |
+
size 4932734584
|
model-00039-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fae5190c8a89eb7183bbcf3779a1782923884bc83dd2db7483849001a12407ae
|
3 |
+
size 4865527176
|
model-00040-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:800093906370d6e66763e410095bceda6d851593042aea519c0d8af7a2d85207
|
3 |
+
size 4865527176
|
model-00041-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e724ebb6a630a8543095e4d3c5f3d4eb4c284aa55ed4b7d0d4b90c4b651d417f
|
3 |
+
size 4865527176
|
model-00042-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54a623128d911a08320f63b9051f2a48e1ec91e6f7972f2a0fff731efc483e47
|
3 |
+
size 4865527176
|
model-00043-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:137d2983a77e64bfd1b4c721aa8891158db0775f0610ce0838146ec1a9bc59a9
|
3 |
+
size 4865527176
|
model-00044-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b6cdb007966f38ce57eba46633704fc900f1304910d19d44cf8d4e548775c38
|
3 |
+
size 1933624528
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|