Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +87 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_140.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,87 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q0f16",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 8192,
|
7 |
+
"intermediate_size": 28672,
|
8 |
+
"num_attention_heads": 64,
|
9 |
+
"num_hidden_layers": 80,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 500000.0,
|
14 |
+
"rope_scaling": {
|
15 |
+
"factor": 8.0,
|
16 |
+
"high_freq_factor": 4.0,
|
17 |
+
"low_freq_factor": 1.0,
|
18 |
+
"original_max_position_embeddings": 8192,
|
19 |
+
"rope_type": "llama3"
|
20 |
+
},
|
21 |
+
"context_window_size": 131072,
|
22 |
+
"prefill_chunk_size": 8192,
|
23 |
+
"num_key_value_heads": 8,
|
24 |
+
"head_dim": 128,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"pipeline_parallel_stages": 1,
|
27 |
+
"max_batch_size": 128,
|
28 |
+
"disaggregation": false
|
29 |
+
},
|
30 |
+
"vocab_size": 128256,
|
31 |
+
"context_window_size": 131072,
|
32 |
+
"sliding_window_size": -1,
|
33 |
+
"prefill_chunk_size": 8192,
|
34 |
+
"attention_sink_size": -1,
|
35 |
+
"tensor_parallel_shards": 1,
|
36 |
+
"pipeline_parallel_stages": 1,
|
37 |
+
"temperature": 1.0,
|
38 |
+
"presence_penalty": 0.0,
|
39 |
+
"frequency_penalty": 0.0,
|
40 |
+
"repetition_penalty": 1.0,
|
41 |
+
"top_p": 1.0,
|
42 |
+
"tokenizer_files": [
|
43 |
+
"tokenizer.json",
|
44 |
+
"tokenizer_config.json"
|
45 |
+
],
|
46 |
+
"tokenizer_info": {
|
47 |
+
"token_postproc_method": "byte_level",
|
48 |
+
"prepend_space_in_encode": false,
|
49 |
+
"strip_space_in_decode": false
|
50 |
+
},
|
51 |
+
"conv_template": {
|
52 |
+
"name": "deepseek_v3",
|
53 |
+
"system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
|
54 |
+
"system_message": "You are a helpful assistant.",
|
55 |
+
"system_prefix_token_ids": null,
|
56 |
+
"add_role_after_system_message": true,
|
57 |
+
"roles": {
|
58 |
+
"user": "<\uff5cUser\uff5c>",
|
59 |
+
"assistant": "<\uff5cAssistant\uff5c>"
|
60 |
+
},
|
61 |
+
"role_templates": {
|
62 |
+
"user": "{user_message}",
|
63 |
+
"assistant": "{assistant_message}",
|
64 |
+
"tool": "{tool_message}"
|
65 |
+
},
|
66 |
+
"messages": [],
|
67 |
+
"seps": [
|
68 |
+
"",
|
69 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
70 |
+
],
|
71 |
+
"role_content_sep": "",
|
72 |
+
"role_empty_sep": "",
|
73 |
+
"stop_str": [],
|
74 |
+
"stop_token_ids": [
|
75 |
+
151643
|
76 |
+
],
|
77 |
+
"function_string": "",
|
78 |
+
"use_function_calling": false
|
79 |
+
},
|
80 |
+
"pad_token_id": 0,
|
81 |
+
"bos_token_id": 128000,
|
82 |
+
"eos_token_id": [
|
83 |
+
128001,
|
84 |
+
128008,
|
85 |
+
128009
|
86 |
+
]
|
87 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:722a52071153f271780f0e859832fc44b61eb8fde560207eb83aa955a08a9f0c
|
3 |
+
size 2101346304
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf4dc6a3720bae1934b699bfa0b5dc1604656b7c19852ad8569918cdd3d7bec1
|
3 |
+
size 167772160
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d57ede7bb1be550135713466d5479dc63e5c8ed4544fea38fde2e29d8c9a06de
|
3 |
+
size 134217728
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d46dc2c49404224eaba269675f3f45e20e5508a3d1e7973d5d8ddd4fced5afea
|
3 |
+
size 469762048
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39f09a4b2367254d8502d8a033e3f0231280b551b90bb4ae8577de508fd28654
|
3 |
+
size 167772160
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d89d6580716182dd9c73c95b758cd8d25a3f20d1bde4a5a7177fcbdc57e33255
|
3 |
+
size 134217728
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f78b90168f2a7c9003b319dce928e765957e1ebc3f7d22868ab31e8680820b20
|
3 |
+
size 939524096
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96d61d4c5408b28fed476d5f78c93b7ce1e0e1c3f2ab2ebb4dfaa9b428a517aa
|
3 |
+
size 469762048
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e061261a95e1cc7583b5d9179d9ffffdeb030c12e3b965b940ab5327543b0c84
|
3 |
+
size 167772160
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f88d3a72e65e2bcc135fb30d720f57c626e098222f2c699f8d0a70410ee5af6
|
3 |
+
size 134217728
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:887c4d33198f1d88095ae7107842f678a88bdf7d66d7c3f2529e9cd0f0bc8aa3
|
3 |
+
size 939524096
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e77bb18e481f1eae2cf936c7ba933aedb5ac1bef89b804ca941448c14304e8e6
|
3 |
+
size 469762048
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:543e3f9ca9f4ce59c0ae450e246dcc18edb14c858106da2b15f2a07fd138f9c1
|
3 |
+
size 167772160
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5227a11124f9335372416212c237f4f5ebb33bf23f9d9b733f724d4282c541ac
|
3 |
+
size 939524096
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e920f1425f14cb5f2ce1da2278255bcceda06186c111d2b4ef95ffb9aa2a157
|
3 |
+
size 134217728
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19aa95b87ac4d6810e8028652016fa0dce0a0570cc7fe51d907dc284783ff117
|
3 |
+
size 939524096
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df3732d29d9fd0387076256dd3506b03b59f74c1a77cbd776d8529119a44f9e4
|
3 |
+
size 469762048
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad0dedf41b8accaa6ea8c2dcedd3b1a0dbe886e4fd94fe26b6616d7037c0f600
|
3 |
+
size 167772160
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f2f17a98822afc1893072da82c6c0def5f5750213a53d5a767b63e43a7d6672
|
3 |
+
size 134217728
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a11caf4f8acbca673ff9d41accb6700c29845705dc7019ac1557527eb00773d1
|
3 |
+
size 939524096
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06ed09b007972df0ac3e5e55dc99b02b09337a7af39b0cb631df8a55990a7899
|
3 |
+
size 469762048
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4279c662433fb2fd339f5a42cd204c37ad2b96901e0f610d8a9b9bbec6b33d67
|
3 |
+
size 167772160
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc084f2bede07976ca66d577998aacd338ebbbbeef3fdbf243a5d9ff4ffe6ac7
|
3 |
+
size 134217728
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa2dde11842362095b9df331e38c6f75e90368b8bdb6ddf1c0d7a77bd0376a36
|
3 |
+
size 939524096
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e67fe7bb49d069ac1b8c7bd7adeae7eac17ca6d2d7a54bd795c8d415b30b079
|
3 |
+
size 469762048
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64777ec0770cab97783f57bb610e889c65fbf48d860fa511059193933a48c030
|
3 |
+
size 469762048
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b95046f966869800e32bb3707a8e55a469c1f79c057795aed6bc5e174928670b
|
3 |
+
size 167772160
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2dfd2b9e23aca2c15d1ba7915b9bee55cb23e033869986aec5d4f62f737a109f
|
3 |
+
size 134217728
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a67200c28bea95e7d37a29e0981d2dc4c67fb498860899a3e0285f9f1240d704
|
3 |
+
size 939524096
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1eb8bebe906aa9e3d6ae8ccecb3916a6a4e9fca34b5dffe8eb50989ebe86aba9
|
3 |
+
size 469762048
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ead0b64399c90c8afc07f0acef0154d1f07171f040d20ec1b8eaeb9861e8a89
|
3 |
+
size 167772160
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b8afcae04c7ded66b0b7e56d26cc22510b3bc5f822025d97b5b1f7784ea2102
|
3 |
+
size 134217728
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02c1dcedc0c8d6c8cb089ca12522516febf6909144195348709c030aa1598419
|
3 |
+
size 939524096
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6482cda8c3fafef1841670156d062936b45b30ce3db13b54fa06496494599aec
|
3 |
+
size 469762048
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8562691e12f66215b5e735c25f056d78bbea35fcebea311762c6cbbc29c14c8
|
3 |
+
size 167772160
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a592a55063eeb0b318f217d26c9a82e7c17e8ef290ebf90fdb52c77f283808c
|
3 |
+
size 167772160
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1af62e4577a04580f80d0e5f4385e0c3c91a4e2615ff0146f737a0c220665f0
|
3 |
+
size 134217728
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:588070c3085e8e65820122ca825e4c3a373e7e040b652daf1edf052aab7015b2
|
3 |
+
size 939524096
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72dd7a83f40ba89a4b31fd3dd2c36e1b528ebf6fd7ed0def37ed2d9199bcc17b
|
3 |
+
size 469762048
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e80e15653a75b30bd861bc764e7324607e1afd385b3dfabcc2d2462de2063ee
|
3 |
+
size 167772160
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9ba4ee4d7d72117a8674585f3b88629ae09e6fe3f9c2dbc51fc942c938ad292
|
3 |
+
size 134217728
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89ad20b44e8d575f4dbf221783e01e0498cd60957080ddc8734e520c7f2efcd7
|
3 |
+
size 939524096
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92208f7ad548e56c98f357f857b547e909c03d322ad76b55c510b3367c4be9b9
|
3 |
+
size 469762048
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdf434840ce251f0602bfb8053f2e937eac58110b449a5a16cfd940aa148c358
|
3 |
+
size 167772160
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b3f87aaadd4fa4e0d7dddeeda99f65428ead03f5ac4cc7d3223c13a869ad668
|
3 |
+
size 134217728
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ccaf504d41ea436d4e0bffb2d9a8073899027038bd048e1bc347dfdad889f4a
|
3 |
+
size 939524096
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9067ed3830b7596e641f32147e8f1df4488d30ca5e2ff421b3bd1ec813cd8757
|
3 |
+
size 134217728
|
params_shard_140.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:164bad18522840292c7153423d34314f0914145aa79b64c02db1c96ca93cb98e
|
3 |
+
size 469762048
|