scottto committed on
Commit
2f7dffd
1 Parent(s): bfe56ec

llama 3.1 8b q4f16_1

Browse files
This view is limited to 50 files because the commit contains too many changes. See raw diff
mlc-chat-config.json ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "llama",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "hidden_size": 4096,
7
+ "intermediate_size": 14336,
8
+ "num_attention_heads": 32,
9
+ "num_hidden_layers": 32,
10
+ "rms_norm_eps": 1e-05,
11
+ "vocab_size": 128256,
12
+ "tie_word_embeddings": false,
13
+ "position_embedding_base": 500000.0,
14
+ "context_window_size": 131072,
15
+ "prefill_chunk_size": 2048,
16
+ "num_key_value_heads": 8,
17
+ "head_dim": 128,
18
+ "tensor_parallel_shards": 1,
19
+ "max_batch_size": 80
20
+ },
21
+ "vocab_size": 128256,
22
+ "context_window_size": 131072,
23
+ "sliding_window_size": -1,
24
+ "prefill_chunk_size": 2048,
25
+ "attention_sink_size": -1,
26
+ "tensor_parallel_shards": 1,
27
+ "temperature": 0.6,
28
+ "presence_penalty": 0.0,
29
+ "frequency_penalty": 0.0,
30
+ "repetition_penalty": 1.0,
31
+ "top_p": 0.9,
32
+ "tokenizer_files": [
33
+ "tokenizer.json",
34
+ "tokenizer_config.json"
35
+ ],
36
+ "tokenizer_info": {
37
+ "token_postproc_method": "byte_level",
38
+ "prepend_space_in_encode": false,
39
+ "strip_space_in_decode": false
40
+ },
41
+ "conv_template": {
42
+ "name": "llama-2",
43
+ "system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n",
44
+ "system_message": "You are a helpful, respectful and honest assistant.",
45
+ "system_prefix_token_ids": [
46
+ 1
47
+ ],
48
+ "add_role_after_system_message": false,
49
+ "roles": {
50
+ "user": "<s>[INST]",
51
+ "assistant": "[/INST]",
52
+ "tool": "[INST]"
53
+ },
54
+ "role_templates": {
55
+ "user": "{user_message}",
56
+ "assistant": "{assistant_message}",
57
+ "tool": "{tool_message}"
58
+ },
59
+ "messages": [],
60
+ "seps": [
61
+ " ",
62
+ " </s>"
63
+ ],
64
+ "role_content_sep": " ",
65
+ "role_empty_sep": " ",
66
+ "stop_str": [
67
+ "[INST]"
68
+ ],
69
+ "stop_token_ids": [
70
+ 2
71
+ ],
72
+ "function_string": "",
73
+ "use_function_calling": false
74
+ },
75
+ "pad_token_id": 0,
76
+ "bos_token_id": 128000,
77
+ "eos_token_id": 128001
78
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db76a88f4c434aa384119adbebd8f7d8b56193853565e28b91ae2d536ed06824
3
+ size 262668288
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08e6f1eb7c8be4e40137f35f916531ea775f8f74956bd3e44dbd8fe3ac807e8b
3
+ size 29360128
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d92dc2075df18f3a20afc5012c16b57576219f8d23a1fef8ed6355433cb7491a
3
+ size 33046528
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b7564ba46e1758aefb93e6184d77302958525a2df7c1f7e505df5aa4f4b6971
3
+ size 58720256
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efdac929de8b8e2fa9656968c0c2a8201725435350e27553fedc140ac6fe7b5f
3
+ size 25174016
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f875bd819c2414eb5a3b5a69cb6ee4f3525a6abd92794d5cae8eb49e5b86e5e4
3
+ size 29360128
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a298abe75f0c10e0a5c8f2f4ca0d0850a3319e50e24b7dca140c1ecc8a711de
3
+ size 58720256
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad82de844c98f9054bb98a28d944d52c48dc1149a63b0adb34446f0a5af7cee5
3
+ size 33046528
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:179323c847f5fc97586670a423706513c1573f01a80bfe4a06a83176a11aa1e7
3
+ size 58720256
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c394d2ff4b15f502b4bdc93bd4a9441ec6bec4522d113e7df90ba8c810488e42
3
+ size 32505856
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66bcd1cd7d57e49820d6d81c9c10dd30e10e3081c6a88ddcc4f54dbb98561f9e
3
+ size 9437184
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:787def81ea0863f93f1270860733c9a206b1771e51d2878630a236206f75669d
3
+ size 29360128
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f2fdcd294f41180360ba1c5f2076371343a9b526528faf1a8e27f162509bfbf
3
+ size 58720256
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd3a66f25cf7122533187810b04f8b2cc7d90b4d7db518d88e3ad83fc8cbd78f
3
+ size 22036480
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adb939b359fa54f4523d293425c0be9071f1ceb076c659fa8e31f0130478dd93
3
+ size 29360128
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bc0c25cca436c84734b8d7c7231dc8a1395b54204e8d5a29aad62826bab9c69
3
+ size 58720256
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c2d7e2103c0fc4dbf6ed13ecd16cb3b9f2885ebdeabd076402850eb5756a4f5
3
+ size 27271168
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bf62ac99315d05517cc6085f5c049b44e0e361c3c2e6f3652c21a878254944a
3
+ size 29360128
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b8739a4224814ec88c4959ebe61e276c3b473d87f16f9806a93f27c3dfbf54a
3
+ size 30949376
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1970056327462ce4a298888a39fd7c22da856df8db48e2075c7cebc71af08294
3
+ size 58720256
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51a9b6306f18ca13b235f5a418551c8ef8bf42f6ad87b1d4fd08207811a65184
3
+ size 32841728
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81dc5a2100e07e601b757135a6a005c1923b4bcec87f958415293b4619e07a9a
3
+ size 25174016
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:772ee0a2b032e77274242c394a14ef48a998ed4f254e6442fdde8ef890cc03ab
3
+ size 29360128
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72087c1d9f08339b637103322a9baa2d73cc97a761ca23526edabe7350aaf428
3
+ size 58720256
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c12bb684ebb8996a56eb26c40082b60d0a45700352802c478f9a17ee4a7d9224
3
+ size 33046528
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93b4df532253c33428f2c2ddaedaa4d438bf97965895884eb903583481e574fb
3
+ size 29360128
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df2bd1a8972b1afac47ec82f79e6b91f811b331bdc0ebcec450c5c7532d66286
3
+ size 58720256
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd5e1379414cb5effa44de3c8cff9ece4dcdfd4838d534fcd11f9063206a9083
3
+ size 22036480
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb75b9c3203a6c7c843e9c49a571e505ab4cc68895cb04bac017480b3f86e5a2
3
+ size 29360128
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dfe5df317adbc5f67e12db2ae3044441a76598aa9260a16eeab7ab48a88d2b8
3
+ size 58720256
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:289bd1c3461917d8752892e97032ec482e4fd1f9e72205fa08da7c5e2416aff7
3
+ size 27271168
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa8d6f717e80239b7a9dd7378be7b6d044e880e83ed875031be2414f672e2ae0
3
+ size 262668288
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64739151a5eda6128b4b43c84dccc73d08a77c7676c990e946669ff168aef0c1
3
+ size 29360128
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89d57876cd0bbd35f05b6e4c6dc4a74248646630b27dd14671bd99f0d555cc84
3
+ size 30949376
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd9089e99ea92e7855f166932724397ce30292075ec3f03b706c6702cedb9a49
3
+ size 58720256
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48a9c9c1b772277a244d6fa95843e5ef1e2bc2aa7a4c5ba1dc3e9288dd53eb13
3
+ size 25174016
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:745428d666b40125cacab89536ccca866c2e30f0f5f2bb35a76df2a95a0a2dda
3
+ size 29360128
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e5311e63eff5fb4d1bee134225928b1761f03b337bf746aac53a621065cebf6
3
+ size 58720256
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6a5eac7684f257fc5876d7fc322f6873b6dfd996f4678b85164538c6e212a66
3
+ size 33046528
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a274c716a08f95d2b7d41b1d3fea55cc03e635585ae04e3e507787fbf7bd8600
3
+ size 29360128
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f571d7599043ecaf4b4ae4dca407bbe4d03f6252d49735d692ebfb58f081ca13
3
+ size 58720256
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abab295899b20da9f725d463c1d89a2e80c2870707c2269173ebb5c6ae5f9672
3
+ size 22036480
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d801a55c87ab86adba4e3be81c52f3a24894b687f3169132a0062c0e4840e53
3
+ size 32833536
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a59220800ba74e4cbc4787e759b0c2d2668a8eaa5ad657aebfe748fc6b8f03e
3
+ size 29360128
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db9b1ef6f87d27d40cfcbf9c6c0a08ae520f0d3ea25ae00669e46b37e0b02ef0
3
+ size 58720256
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9031b53be10408597e62141a93019d9512643102b29f34aaf8d26d63cbe62f7
3
+ size 27271168
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1603f6a5b637521317b2e1e83913482613cf58e81d430ce28079bcc17cb5715
3
+ size 29360128
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bbdd819e23307e803326c107e261d0e739ec0d344a103d5f3faf90e3cd892b0
3
+ size 30949376