DopeorNope commited on
Commit
66f4b43
1 Parent(s): 93ecf77

Upload MixtralForCausalLM

Browse files
Files changed (47) hide show
  1. config.json +34 -0
  2. generation_config.json +7 -0
  3. model-00001-of-00044.safetensors +3 -0
  4. model-00002-of-00044.safetensors +3 -0
  5. model-00003-of-00044.safetensors +3 -0
  6. model-00004-of-00044.safetensors +3 -0
  7. model-00005-of-00044.safetensors +3 -0
  8. model-00006-of-00044.safetensors +3 -0
  9. model-00007-of-00044.safetensors +3 -0
  10. model-00008-of-00044.safetensors +3 -0
  11. model-00009-of-00044.safetensors +3 -0
  12. model-00010-of-00044.safetensors +3 -0
  13. model-00011-of-00044.safetensors +3 -0
  14. model-00012-of-00044.safetensors +3 -0
  15. model-00013-of-00044.safetensors +3 -0
  16. model-00014-of-00044.safetensors +3 -0
  17. model-00015-of-00044.safetensors +3 -0
  18. model-00016-of-00044.safetensors +3 -0
  19. model-00017-of-00044.safetensors +3 -0
  20. model-00018-of-00044.safetensors +3 -0
  21. model-00019-of-00044.safetensors +3 -0
  22. model-00020-of-00044.safetensors +3 -0
  23. model-00021-of-00044.safetensors +3 -0
  24. model-00022-of-00044.safetensors +3 -0
  25. model-00023-of-00044.safetensors +3 -0
  26. model-00024-of-00044.safetensors +3 -0
  27. model-00025-of-00044.safetensors +3 -0
  28. model-00026-of-00044.safetensors +3 -0
  29. model-00027-of-00044.safetensors +3 -0
  30. model-00028-of-00044.safetensors +3 -0
  31. model-00029-of-00044.safetensors +3 -0
  32. model-00030-of-00044.safetensors +3 -0
  33. model-00031-of-00044.safetensors +3 -0
  34. model-00032-of-00044.safetensors +3 -0
  35. model-00033-of-00044.safetensors +3 -0
  36. model-00034-of-00044.safetensors +3 -0
  37. model-00035-of-00044.safetensors +3 -0
  38. model-00036-of-00044.safetensors +3 -0
  39. model-00037-of-00044.safetensors +3 -0
  40. model-00038-of-00044.safetensors +3 -0
  41. model-00039-of-00044.safetensors +3 -0
  42. model-00040-of-00044.safetensors +3 -0
  43. model-00041-of-00044.safetensors +3 -0
  44. model-00042-of-00044.safetensors +3 -0
  45. model-00043-of-00044.safetensors +3 -0
  46. model-00044-of-00044.safetensors +3 -0
  47. model.safetensors.index.json +0 -0
config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "solar_moe_3",
3
+ "architectures": [
4
+ "MixtralForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 4096,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 14336,
14
+ "max_position_embeddings": 4096,
15
+ "model_type": "mixtral",
16
+ "num_attention_heads": 32,
17
+ "num_experts_per_tok": 2,
18
+ "num_hidden_layers": 48,
19
+ "num_key_value_heads": 8,
20
+ "num_local_experts": 6,
21
+ "output_router_logits": false,
22
+ "pad_token_id": 2,
23
+ "pretraining_tp": 1,
24
+ "rms_norm_eps": 1e-05,
25
+ "rope_scaling": null,
26
+ "rope_theta": 10000.0,
27
+ "router_aux_loss_coef": 0.001,
28
+ "sliding_window": null,
29
+ "tie_word_embeddings": false,
30
+ "torch_dtype": "float32",
31
+ "transformers_version": "4.36.0.dev0",
32
+ "use_cache": true,
33
+ "vocab_size": 32000
34
+ }
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "pad_token_id": 2,
6
+ "transformers_version": "4.36.0.dev0"
7
+ }
model-00001-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a7f97158ab892d5a7421d084aa640dbccb3cc9abb5cbf1b9e71bbb45bd7d28c
3
+ size 4987161928
model-00002-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44ab382e664b5ab0394e474909caea3efcc31f6b9f6e68a860b7b75723f9d4b2
3
+ size 4966289216
model-00003-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83abc8cb8af127c941805668d1c6acc6bfd376ab06bb856a326c471cc0bb4e5a
3
+ size 4865527152
model-00004-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb48931bb6bb729f2863637c734e74a68de504b80a0a295bfcd42e27e7186976
3
+ size 4865527152
model-00005-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:addb639836e642107d53578a4c249b83ad176f80847590f1410ffe1e516cba88
3
+ size 4865527152
model-00006-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:248d7efcb825fe3a5f5cfbfd7800219db19147a20b9a4a4869e7fcce93ffed9a
3
+ size 4865527152
model-00007-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e5759a8f801dac28da29df94418c60ce2daf7bdbd8c6a0e5e9e757e2c487779
3
+ size 4865527152
model-00008-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2382c5cb986082d11e585226cd887964e1ae1f5233063707abee5bbac7adba2d
3
+ size 4865527152
model-00009-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7d15d96b2166e8200ab68af7eac14956a4708bc660743cb516513424bd388f9
3
+ size 4865527144
model-00010-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24bb1f68166bbc9b6ba57948911985ea4dedada9273830ac3e76e3e8035df5ff
3
+ size 4966223816
model-00011-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:531312f78076dc5ca13b6a45de50532bbd615443218d6ec1ed8feeba84e0d452
3
+ size 4932734584
model-00012-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0766bdeb93ebbf89e6c045be89cfd8041f0dd25de323c80e4c4aeb5853c7e374
3
+ size 4865527176
model-00013-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4247dbdc946bd6e74332db403a5dbffac0df5e92a2696636d57d2e016ff3b012
3
+ size 4865527176
model-00014-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:baff952fccd40670c725174d319f9ac142f5ddc62215a0c78932e3fe61c01fbc
3
+ size 4865527176
model-00015-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fa401272e8a2f2656bf2aa5ca093e592bd5c9230628953a3216d4d8e5ac0806
3
+ size 4865527176
model-00016-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01bea421c21b89f90c4451d0db889fc03c629f7f98d32225307188e3d5634d2f
3
+ size 4865527176
model-00017-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2935e2fb733c7b72bc22f6d728f12cb5e991445db80554dc7eaa39f4107f19c5
3
+ size 4865527176
model-00018-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50e329f234b30c0bb2b1259bd33e748f34525b1fe4e943e3c19b461416566c7e
3
+ size 4865527176
model-00019-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46f39c6af9e582a7d9ad676651f3748d810d9d83da02847151b76ecc26275573
3
+ size 4966223816
model-00020-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eefe94fed65bc4be544b5f93698637c55e6317bbb6d6e0e87b75e148ea91234
3
+ size 4932734584
model-00021-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:001e0a8a37fdff52dde88121dec9fcce87102989ed668f0ac4ba34b379afc067
3
+ size 4865527176
model-00022-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8c4b3ce5ae63a1d74d139b9b883f3e41774f691559384d8fbf22fba9341e47d
3
+ size 4865527176
model-00023-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7637b4f77653da5231fe97a50df43c2032ebc7aa0da6a25e64ccc785972065b1
3
+ size 4865527176
model-00024-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71cf12635acecd62c1295b6a1ced27eea72054661aca91e1be04305cf92b23a0
3
+ size 4865527176
model-00025-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32e6ef122acd31d9e9f5f568014dd1e846a37c30f82c628e12c2310e38153bf0
3
+ size 4865527176
model-00026-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abf9ab5b50125f690a13147e1812d4aae464e21ec0cf1d01d9e2f576c418f3b
3
+ size 4865527176
model-00027-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4816f59e12033c2208a96966453cb88f3bf1ba79eb62db4fb356cd5d5c982e6
3
+ size 4865527176
model-00028-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36583a3bccbcef08e6cdbd7095408583985a9e4181b0de4742e45469a9ab0145
3
+ size 4966223816
model-00029-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff23264f229e63b1e3eed9e674d9c4afb73908f06e4b08f4b6880a88feeb22aa
3
+ size 4932734584
model-00030-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c58b983366f1bbba13512a22a5484b23579b1b9b6b26c597a6cc7b4fc6fa224
3
+ size 4865527176
model-00031-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21a6905de5e32cce8e0f847993c361df8de6471b6118145d24689151838c5c04
3
+ size 4865527176
model-00032-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1be33703958014091502ad127202e75a08e79b3e2005986e73f4a39ecf6e2fea
3
+ size 4865527176
model-00033-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:733e0f88850fa1d5b7879668dc3b2e602400cc40ca4998c82d46b3f9f3f0b592
3
+ size 4865527176
model-00034-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dea0f2aaf5a9985a79f4f55977eb31fdafbd07b21c42b071f5c3eacd2a780768
3
+ size 4865527176
model-00035-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c666c53a5fa2287efad4279350e2ba633d168e462bd00b4e4e76ec503aee81db
3
+ size 4865527176
model-00036-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca171c1d92c3dc34d8a15ea488e231e3532cdbaf46d957478cd31a2f895d2483
3
+ size 4865527176
model-00037-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdfadabf288d31a680d4835477bbc0548de3733acc555a22c1537eee5553590c
3
+ size 4966223816
model-00038-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c26a2814743022c163d40248170d819d41f3d798ff6c920964792d6bf35b643
3
+ size 4932734584
model-00039-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fae5190c8a89eb7183bbcf3779a1782923884bc83dd2db7483849001a12407ae
3
+ size 4865527176
model-00040-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:800093906370d6e66763e410095bceda6d851593042aea519c0d8af7a2d85207
3
+ size 4865527176
model-00041-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e724ebb6a630a8543095e4d3c5f3d4eb4c284aa55ed4b7d0d4b90c4b651d417f
3
+ size 4865527176
model-00042-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54a623128d911a08320f63b9051f2a48e1ec91e6f7972f2a0fff731efc483e47
3
+ size 4865527176
model-00043-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:137d2983a77e64bfd1b4c721aa8891158db0775f0610ce0838146ec1a9bc59a9
3
+ size 4865527176
model-00044-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b6cdb007966f38ce57eba46633704fc900f1304910d19d44cf8d4e548775c38
3
+ size 1933624528
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff