Update mlc-chat-config.json
Browse files
- mlc-chat-config.json +3 -3
mlc-chat-config.json
CHANGED
@@ -10,16 +10,16 @@
|
|
10 |
"vocab_size": 128256,
|
11 |
"position_embedding_base": 500000.0,
|
12 |
"context_window_size": 8192,
|
13 |
-
"prefill_chunk_size":
|
14 |
"num_key_value_heads": 8,
|
15 |
"head_dim": 128,
|
16 |
"tensor_parallel_shards": 1,
|
17 |
-
"max_batch_size":
|
18 |
},
|
19 |
"vocab_size": 128256,
|
20 |
"context_window_size": 8192,
|
21 |
"sliding_window_size": -1,
|
22 |
-
"prefill_chunk_size":
|
23 |
"attention_sink_size": -1,
|
24 |
"tensor_parallel_shards": 1,
|
25 |
"mean_gen_len": 128,
|
|
|
10 |
"vocab_size": 128256,
|
11 |
"position_embedding_base": 500000.0,
|
12 |
"context_window_size": 8192,
|
13 |
+
"prefill_chunk_size": 8192,
|
14 |
"num_key_value_heads": 8,
|
15 |
"head_dim": 128,
|
16 |
"tensor_parallel_shards": 1,
|
17 |
+
"max_batch_size": 128
|
18 |
},
|
19 |
"vocab_size": 128256,
|
20 |
"context_window_size": 8192,
|
21 |
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 8192,
|
23 |
"attention_sink_size": -1,
|
24 |
"tensor_parallel_shards": 1,
|
25 |
"mean_gen_len": 128,
|