Upload folder using huggingface_hub
Browse files- mlc-chat-config.json +3 -3
mlc-chat-config.json
CHANGED
@@ -140,15 +140,15 @@
|
|
140 |
},
|
141 |
"original_max_position_embeddings": 4096,
|
142 |
"context_window_size": 131072,
|
143 |
-
"prefill_chunk_size":
|
144 |
"head_dim": 96,
|
145 |
"tensor_parallel_shards": 1,
|
146 |
-
"max_batch_size":
|
147 |
},
|
148 |
"vocab_size": 32064,
|
149 |
"context_window_size": 131072,
|
150 |
"sliding_window_size": -1,
|
151 |
-
"prefill_chunk_size":
|
152 |
"attention_sink_size": -1,
|
153 |
"tensor_parallel_shards": 1,
|
154 |
"pipeline_parallel_stages": 1,
|
|
|
140 |
},
|
141 |
"original_max_position_embeddings": 4096,
|
142 |
"context_window_size": 131072,
|
143 |
+
"prefill_chunk_size": 8192,
|
144 |
"head_dim": 96,
|
145 |
"tensor_parallel_shards": 1,
|
146 |
+
"max_batch_size": 128
|
147 |
},
|
148 |
"vocab_size": 32064,
|
149 |
"context_window_size": 131072,
|
150 |
"sliding_window_size": -1,
|
151 |
+
"prefill_chunk_size": 8192,
|
152 |
"attention_sink_size": -1,
|
153 |
"tensor_parallel_shards": 1,
|
154 |
"pipeline_parallel_stages": 1,
|