Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +34 -0
- generation_config.json +7 -0
- model-00001-of-00201.safetensors +3 -0
- model-00002-of-00201.safetensors +3 -0
- model-00003-of-00201.safetensors +3 -0
- model-00004-of-00201.safetensors +3 -0
- model-00005-of-00201.safetensors +3 -0
- model-00006-of-00201.safetensors +3 -0
- model-00007-of-00201.safetensors +3 -0
- model-00008-of-00201.safetensors +3 -0
- model-00009-of-00201.safetensors +3 -0
- model-00010-of-00201.safetensors +3 -0
- model-00011-of-00201.safetensors +3 -0
- model-00012-of-00201.safetensors +3 -0
- model-00013-of-00201.safetensors +3 -0
- model-00014-of-00201.safetensors +3 -0
- model-00015-of-00201.safetensors +3 -0
- model-00016-of-00201.safetensors +3 -0
- model-00017-of-00201.safetensors +3 -0
- model-00018-of-00201.safetensors +3 -0
- model-00019-of-00201.safetensors +3 -0
- model-00020-of-00201.safetensors +3 -0
- model-00021-of-00201.safetensors +3 -0
- model-00022-of-00201.safetensors +3 -0
- model-00023-of-00201.safetensors +3 -0
- model-00024-of-00201.safetensors +3 -0
- model-00025-of-00201.safetensors +3 -0
- model-00026-of-00201.safetensors +3 -0
- model-00027-of-00201.safetensors +3 -0
- model-00028-of-00201.safetensors +3 -0
- model-00029-of-00201.safetensors +3 -0
- model-00030-of-00201.safetensors +3 -0
- model-00031-of-00201.safetensors +3 -0
- model-00032-of-00201.safetensors +3 -0
- model-00033-of-00201.safetensors +3 -0
- model-00034-of-00201.safetensors +3 -0
- model-00035-of-00201.safetensors +3 -0
- model-00036-of-00201.safetensors +3 -0
- model-00037-of-00201.safetensors +3 -0
- model-00038-of-00201.safetensors +3 -0
- model-00039-of-00201.safetensors +3 -0
- model-00040-of-00201.safetensors +3 -0
- model-00041-of-00201.safetensors +3 -0
- model-00042-of-00201.safetensors +3 -0
- model-00043-of-00201.safetensors +3 -0
- model-00044-of-00201.safetensors +3 -0
- model-00045-of-00201.safetensors +3 -0
- model-00046-of-00201.safetensors +3 -0
- model-00047-of-00201.safetensors +3 -0
- model-00048-of-00201.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "basemodels/llama-2-3x70b-chat-hf",
|
3 |
+
"architectures": [
|
4 |
+
"MixtralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 2048,
|
15 |
+
"model_type": "mixtral",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_experts_per_tok": 2,
|
18 |
+
"num_hidden_layers": 80,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"num_local_experts": 3,
|
21 |
+
"output_router_logits": false,
|
22 |
+
"pad_token_id": 0,
|
23 |
+
"pretraining_tp": 1,
|
24 |
+
"rms_norm_eps": 1e-05,
|
25 |
+
"rope_scaling": null,
|
26 |
+
"rope_theta": 10000.0,
|
27 |
+
"router_aux_loss_coef": 0.001,
|
28 |
+
"sliding_window": null,
|
29 |
+
"tie_word_embeddings": false,
|
30 |
+
"torch_dtype": "bfloat16",
|
31 |
+
"transformers_version": "4.37.0.dev0",
|
32 |
+
"use_cache": true,
|
33 |
+
"vocab_size": 32000
|
34 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.37.0.dev0"
|
7 |
+
}
|
model-00001-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc2d964de3fb392e869f9cbd9fcc1fccf3e3b03a91d6b59376b0054ae4f81db8
|
3 |
+
size 1765852120
|
model-00002-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3421e1140f66c3f313d83c0b07e3fdf9b23f5bf69c3c464c979c833a6d239562
|
3 |
+
size 1879048744
|
model-00003-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6dd937412b36e67fbe8b913b16bb80fd86f30707e017e0d8f80ff477c7132e5
|
3 |
+
size 1711359192
|
model-00004-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd8d8b22c8913b47026cddf21020cafb1baa030c44f462ab5185a11d75757987
|
3 |
+
size 1879048744
|
model-00005-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e19a14064ffbd2e349bd294f2d51f1c3500b64bf302e346d50dac969c16587d5
|
3 |
+
size 1879048744
|
model-00006-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c2266c38ba94579e7178c0b6206e61e20bcabe802b87960e76d8cf5b09c4441
|
3 |
+
size 1711359192
|
model-00007-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:895e107faa6326548d096f8c51ecbf47f5dfa31a245501a6b9aa06210874e92f
|
3 |
+
size 1879048744
|
model-00008-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:878cba7bbac60590b2fe21013424ca4afbfbec5bcee00b6c45bf1d49c332b0ec
|
3 |
+
size 1711359192
|
model-00009-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7673e95bf46bb0b598d34a57577fc90693315e73522b7356b85c5ef7b7679aa0
|
3 |
+
size 1879048744
|
model-00010-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d053f160390702ffff022c4302ff63c50fec282b4ef74e3a83f4ce6585f8074a
|
3 |
+
size 1879048744
|
model-00011-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:969700a8196aa8fd3bb671ef9aa2588619268a5bc823cab8c9a2ba6a23ce9300
|
3 |
+
size 1711359192
|
model-00012-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67dc76051803762fdd13b344a860699b856ca16458b1bd8d83cb7be76f3d4cd5
|
3 |
+
size 1879048744
|
model-00013-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50b22cdaa80390e57a3e7743ed5de6e684dfa2e61993eeda8a270fad2c098326
|
3 |
+
size 1711359192
|
model-00014-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:353d57f6c35cfdd90f534d4fdc536bddeb606178a12619d3249b691deb3ed909
|
3 |
+
size 1879048744
|
model-00015-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fcb4114b6b165b13d537d1674d8b6a1320e1ebce27680593d874af37a0e0158
|
3 |
+
size 1879048744
|
model-00016-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d5336bc96a67d179e2a95ba42d8171f44570a5d56331eb3e04fa6b70f3e2417
|
3 |
+
size 1711359192
|
model-00017-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82449f1e37b146d2756edde885f5e919171802907dc917c72489459f64ef6472
|
3 |
+
size 1879048744
|
model-00018-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82206fde2d9c189388b12d1e4c7b1139aedeb54aeb260b8f4e52c06a9f1e9f00
|
3 |
+
size 1711359192
|
model-00019-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20313c0f5312c179156a6db667c24d34c4eff2637ea95f4aa1fae42deefa215f
|
3 |
+
size 1879048744
|
model-00020-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c021a71e9f88944d1a7e80751995b30bcda7e6a4a0c84d24d319db4a5666d2fe
|
3 |
+
size 1879048744
|
model-00021-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c267740320572476257fa53f163a6ba218cbccf901f9cfb742814eee1a53568e
|
3 |
+
size 1711359192
|
model-00022-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e84bfbb751d6be8e2461a03dc570a35362a54a59644441801a7828c9f115902f
|
3 |
+
size 1879048744
|
model-00023-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcfe862bae36eef552584ec05e3065bcf0f5c325f2b601d5a7661c363f313173
|
3 |
+
size 1711359192
|
model-00024-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0cdb32ece4f5ed5caf476c4c40d0eb5425f3a792d3230e3a60fa1268e3ef4cf
|
3 |
+
size 1879048744
|
model-00025-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:947f9e218127f729b96006bfe508590c917f20ff9757a1ea5439b465da4bc65a
|
3 |
+
size 1879048744
|
model-00026-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56c3cfc71383101f413b04626ad9961d32c68d0816456ad03a9ddd5611556595
|
3 |
+
size 1711359200
|
model-00027-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c4d1c23186aa9dfcde44f6304e95785e24271ed38a826871f5762dbd379443f
|
3 |
+
size 1879048752
|
model-00028-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6517755053db0630d4f2112c87fb75fb5d56792d84d6b12b6cc7eb8a525f461f
|
3 |
+
size 1711359200
|
model-00029-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:428ddaa00ef2f02055a2e245775a4c17df741c03def737514966d55c089a6d0b
|
3 |
+
size 1879048752
|
model-00030-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01b87f49fdf24c2a09e60eceb09d05f0dce8aac9597253c65d3127cffad52597
|
3 |
+
size 1879048752
|
model-00031-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dc2d67dbbc6a6f9ccfb57c8743cd8327abf9cc7cce305bb2d6e1e5a91eb6faa
|
3 |
+
size 1711359200
|
model-00032-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc417773d71cb6724fb777930b261ba5c1abefbbb254352d1e0c3e16195dbe6f
|
3 |
+
size 1879048752
|
model-00033-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:051797c6badb86e768bf44d9dfa53d1bfd278d006197b5477cd5c2ace13433f6
|
3 |
+
size 1711359200
|
model-00034-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb1f6cbe2f6de2d01ad697e7f91bbbb106096ee9c7b1e8e9a5b4e3c394235182
|
3 |
+
size 1879048752
|
model-00035-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf8b93ea5a06baf78e16881d540d027c34206a90e33966ca7095b9dc29f5b421
|
3 |
+
size 1879048752
|
model-00036-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35a0ef36b77ea9d2f996cfe6b528f827ecf6a20767363257f8f7a1807ef8db4c
|
3 |
+
size 1711359200
|
model-00037-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:889ba1d73e977127fd4e63751411506e34f3e0bb6086a89f6d3fc98e3d17bc4a
|
3 |
+
size 1879048752
|
model-00038-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d22d31279aeea3afd0315dbb709b125a53ad008cdfbb6738308e86dd639d74d
|
3 |
+
size 1711359200
|
model-00039-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f473550e342eac6e4b6e6b53ad50b14567d8aa496823ecb63297261bbb83e576
|
3 |
+
size 1879048752
|
model-00040-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f1e13f7c3acbb11ea1fa7abff6c31dcbf989ad9cc6de0abab21987ba1a50940
|
3 |
+
size 1879048752
|
model-00041-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7182209af2e4415ce0e10926eb193991f4981d83372bcf1dee73f0ceaa2c717
|
3 |
+
size 1711359200
|
model-00042-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3c2a3ca4cfdb3796dd3612e140d2ad9dc341ef70dc12d55d91a4a4e90bf133f
|
3 |
+
size 1879048752
|
model-00043-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b50b94e300cbc110b37b3ccf603fd3c332a989fae7929c4563e1d346002ab08
|
3 |
+
size 1711359200
|
model-00044-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8870a479b3bfe1e7171bd6b7a58835590e19e5737cf8a3fe0f42b75a8d299504
|
3 |
+
size 1879048752
|
model-00045-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdae91ded39049fcde82b782ab6483a32c1ba3aa494407aeecb110d2a2a463fb
|
3 |
+
size 1879048752
|
model-00046-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6c573ff796ee761c5900330d6dec5035721c77aef401fdd88fe53abebe9384c
|
3 |
+
size 1711359200
|
model-00047-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:307279987bae94f8e5a6dac5c2745f92544e346c9cb33be79629a58f8f14737f
|
3 |
+
size 1879048752
|
model-00048-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9d3d0d3c1a7aa748dbc167aec23fdbc20ea5a1b5f3dd0c489f3526e1a6ea972
|
3 |
+
size 1711359200
|