TNT3530 committed
Commit f5122d4
1 Parent(s): 64bd952

Update mlc-chat-config.json

Files changed (1):
  mlc-chat-config.json  +4 -4
mlc-chat-config.json CHANGED
@@ -12,24 +12,24 @@
  "intermediate_size": 22528,
  "layer_norm_eps": 1e-05,
  "position_embedding_base": 8000000.0,
- "context_window_size": 8192,
+ "context_window_size": 131072,
  "prefill_chunk_size": 2048,
  "head_dim": 128,
  "tensor_parallel_shards": 1,
  "max_batch_size": 80
  },
  "vocab_size": 256000,
- "context_window_size": 8192,
+ "context_window_size": 131072,
  "sliding_window_size": -1,
  "prefill_chunk_size": 2048,
  "attention_sink_size": -1,
  "tensor_parallel_shards": 1,
  "pipeline_parallel_stages": 1,
- "temperature": 1.0,
+ "temperature": 0.85,
  "presence_penalty": 0.0,
  "frequency_penalty": 0.0,
  "repetition_penalty": 1.0,
- "top_p": 1.0,
+ "top_p": 0.95,
  "tokenizer_files": [
  "tokenizer.json",
  "tokenizer_config.json"