mlc-ai
/

Llama-3-70B-Instruct-q4f16_1-MLC

Model card Files and versions Community

ruihanglai committed on Sep 19, 2024

Commit

b10e55e

·

verified ·

1 Parent(s): 6f3a9d9

Update mlc-chat-config.json

Files changed (1) hide show

mlc-chat-config.json +3 -3

mlc-chat-config.json CHANGED Viewed

@@ -10,16 +10,16 @@
     "vocab_size": 128256,
     "position_embedding_base": 500000.0,
     "context_window_size": 8192,
-    "prefill_chunk_size": 2048,
     "num_key_value_heads": 8,
     "head_dim": 128,
     "tensor_parallel_shards": 1,
-    "max_batch_size": 80
   },
   "vocab_size": 128256,
   "context_window_size": 8192,
   "sliding_window_size": -1,
-  "prefill_chunk_size": 2048,
   "attention_sink_size": -1,
   "tensor_parallel_shards": 1,
   "mean_gen_len": 128,

     "vocab_size": 128256,
     "position_embedding_base": 500000.0,
     "context_window_size": 8192,
+    "prefill_chunk_size": 8192,
     "num_key_value_heads": 8,
     "head_dim": 128,
     "tensor_parallel_shards": 1,
+    "max_batch_size": 128
   },
   "vocab_size": 128256,
   "context_window_size": 8192,
   "sliding_window_size": -1,
+  "prefill_chunk_size": 8192,
   "attention_sink_size": -1,
   "tensor_parallel_shards": 1,
   "mean_gen_len": 128,