CharlieFRuan
committed on
Commit
•
a10f84d
1
Parent(s):
a7511a9
Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- added_tokens.json +4 -0
- logs.txt +0 -0
- mlc-chat-config.json +43 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
added_tokens.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|im_end|>": 32000,
|
3 |
+
"<|im_start|>": 32001
|
4 |
+
}
|
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "mistral",
|
3 |
+
"quantization": "q4f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 4096,
|
6 |
+
"intermediate_size": 14336,
|
7 |
+
"num_attention_heads": 32,
|
8 |
+
"num_hidden_layers": 32,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 32002,
|
11 |
+
"position_embedding_base": 10000.0,
|
12 |
+
"context_window_size": -1,
|
13 |
+
"num_key_value_heads": 8,
|
14 |
+
"head_dim": 128,
|
15 |
+
"sliding_window_size": 4096,
|
16 |
+
"prefill_chunk_size": 4096,
|
17 |
+
"attention_sink_size": 4,
|
18 |
+
"tensor_parallel_shards": 1
|
19 |
+
},
|
20 |
+
"vocab_size": 32002,
|
21 |
+
"context_window_size": -1,
|
22 |
+
"sliding_window_size": 4096,
|
23 |
+
"prefill_chunk_size": 4096,
|
24 |
+
"attention_sink_size": 4,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"mean_gen_len": 128,
|
27 |
+
"max_gen_len": 512,
|
28 |
+
"shift_fill_factor": 0.3,
|
29 |
+
"temperature": 0.7,
|
30 |
+
"repetition_penalty": 1.0,
|
31 |
+
"top_p": 0.95,
|
32 |
+
"conv_template": "neural_hermes_mistral",
|
33 |
+
"pad_token_id": 0,
|
34 |
+
"bos_token_id": 1,
|
35 |
+
"eos_token_id": 32000,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.model",
|
38 |
+
"tokenizer.json",
|
39 |
+
"added_tokens.json",
|
40 |
+
"tokenizer_config.json"
|
41 |
+
],
|
42 |
+
"version": "0.1.0"
|
43 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49a1006b4268434107493fa3ed60cc811c83615736edf2b4f0cd4ed625fb8881
|
3 |
+
size 65540096
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37899d1396a4ce7bb9e2447f1a226cb00a3893ac69490a0baa95e2c873deccb9
|
3 |
+
size 29360128
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:742ff1448c124b903aa7762e4feca668052676804b8ccbb643260cdbd87ddf96
|
3 |
+
size 30949376
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9f5f467d188355fb9ad668562ce03db44936a38b5f8636653e596e39477a415
|
3 |
+
size 27271168
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e73858c6e8ea97da2ebd605dbec2bef527e243e7693765f92ef336c97273700
|
3 |
+
size 29360128
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02b9486f6c0c41cd83fbbfbd24c39106d23c5a5731d2eaef75af9d66f97d5fa1
|
3 |
+
size 30949376
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1dacee8b81b924441ca71f864183fd939ab9f57b807bf1270fbefd5fc976b6a6
|
3 |
+
size 58720256
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8061a5b0523c5a8004fb1b3e5f7286e663995e4550edc1e6d9d1255905c3aef
|
3 |
+
size 25174016
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2041f67b4b8ad01ca32a1f886d799b199bcf432c58853764ad00a3ca15f44083
|
3 |
+
size 33030144
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67c9d19bdf3f177ca9539da7c31118d3cc65670f80bc3f1a57f1f1ba367447c3
|
3 |
+
size 58720256
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:319e3693d8b9df84db0cf0e6028ed020163abf2fda4a052b9f7958d5b036570d
|
3 |
+
size 25174016
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c4fd2c26c4a5901390913497ab74610f1c68140da3534c45e2e593af37609ea
|
3 |
+
size 29360128
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a35f8f893088a325054fec08e6aa46bbcbcbff30bf6b64dda216e9f02cd4263d
|
3 |
+
size 58720256
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb2fe626e44ac45b9cf106ada8636d0fa5d04d72ff9603d29c51d610f8edb8c3
|
3 |
+
size 33046528
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b4a50d679170694afd96b895935668c84da85942cfe7829046efe22bbe64c56
|
3 |
+
size 29360128
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f51c29a93311d48f4a4bece1f765d2a208e51a1fd6341b33f6cc27245c641ef
|
3 |
+
size 58720256
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37d35179a56c7300e0f7a4464fd5075ab7d65ddec3317d28df4492c6b2496087
|
3 |
+
size 22036480
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff58f1f90a1d44653e3d52024a4d66cbce029f536257166d0008d704d3f18a06
|
3 |
+
size 29360128
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73d7fa0fa8043980b5bfe9047266c6ad9ff80cb09948a26a166e36c34377d2c0
|
3 |
+
size 58720256
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92807653031ac20072a26d56b09da9ec92c6c55d2e21424d91b8f05f0e1e7cee
|
3 |
+
size 58720256
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afd1c03979a83533332d8ba71a1dda0f2136d04892d701b1b3d8d1efd257ceea
|
3 |
+
size 27271168
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6492de90e2b3024e70fb033e399b67f38fb32609b969c1ec7cc56fdb37aacee
|
3 |
+
size 29360128
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37d485a080fdbfa4aaa12b6868ba9f9513ffae0b25f16e8ca190c9d8ea225137
|
3 |
+
size 30949376
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f719d34f7e63ce33577bc31d8f8bf574d5829fea3642bc30974706261830f12
|
3 |
+
size 58720256
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be93b78252794aef3a13204062d7a2ec4e1bd10d5a18c1355a51e7bb9f6ca32a
|
3 |
+
size 25174016
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b9533c7db356bd62d94055ba0b0b4326c016354712e28f867258cf1ccc2cf39
|
3 |
+
size 29360128
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bee57b6a40d60bbf5ecefb359728f00b37c9e9a252db12ab9ce78c2f8c63725
|
3 |
+
size 58720256
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3c705ed60338291ebe8314d9d91283530e49015d3cba629e2df19d6909931ca
|
3 |
+
size 33046528
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39ee0a8d91e8e5e0602d2c01be3dc00d3c79a704b3096ac388454daff4330d4b
|
3 |
+
size 29360128
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5b0f62921c94510aed6fc8762e6e782db1761988022adaaf4b5f4e4ee5fcbbc
|
3 |
+
size 29360128
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb71f456d3caceb21429cfb9cd93593016374dea3000272a04b0af5058b90c63
|
3 |
+
size 58720256
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adf28074d3e9b79216e887fa03092d06e13c376b255e952acb15cd0ebae40667
|
3 |
+
size 22036480
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32af1089e3181f4630d8f9e2335bd9ccfd9d64bb54c55cb458202cc7f6a6bacb
|
3 |
+
size 65540096
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f01c8d10254c93a350fa9f24dc3104dd38f295e9dba4b6091e8f7869bad55fe
|
3 |
+
size 29360128
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64dd4e9784873aa69a40b8b14c02bda7dab6f107f66c72e02cf2c2c0c9f4dbc7
|
3 |
+
size 31801856
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9bb89c9b775d5ebb8752a5ba0bb94b3bceae78d1480d63d511d33ded55561a1
|
3 |
+
size 58720256
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b109deba0aba3493048b245b88ed00b112f53799960bc730ad983f01cb56dc20
|
3 |
+
size 25174016
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:848ad8fc299d8951e72a824d47d7742225eac4ca2e65d3a58e6306059ad2bc61
|
3 |
+
size 29360128
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21611ee93c05233f519f8e115ded366f08752eaa6985669e01f7f02868e0e45d
|
3 |
+
size 58720256
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bd336830393123123e49748f19d8be1e3e7044fbb7457d83004887fb313667f
|
3 |
+
size 33046528
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7df99739b158845e71ae79380722eb272597b33ab3e21dfc53bc91ff6f78f708
|
3 |
+
size 58720256
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2c30ffc49b89da1dfcd405db0529fd13dd3eba02920088a198e9bb2a13e2832
|
3 |
+
size 58720256
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2ddaea5d0750c1869d1999d0f5e206283ff047cdac5736aa66677888d895c11
|
3 |
+
size 32505856
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ad327fa9c2bbd574ec8a93038b209f19c6147d732bcfa6e734ae0576909b0e4
|
3 |
+
size 29360128
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10cada196d2b99bb993a617f71c176a19652d083df931053235f7cb564b92c36
|
3 |
+
size 58720256
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2d8b39cca1549b6fb612d63a75a59004ce60d3b837f6f6aa993f855a27f0079
|
3 |
+
size 33046528
|