ruihanglai committed on
Commit
415c1c4
1 Parent(s): d16fcff

Update mlc-chat-config.json

Browse files
Files changed (1) hide show
  1. mlc-chat-config.json +3 -3
mlc-chat-config.json CHANGED
@@ -19,17 +19,17 @@
19
  "rope_type": "llama3"
20
  },
21
  "context_window_size": 131072,
22
- "prefill_chunk_size": 2048,
23
  "num_key_value_heads": 8,
24
  "head_dim": 128,
25
  "tensor_parallel_shards": 1,
26
  "pipeline_parallel_stages": 1,
27
- "max_batch_size": 80
28
  },
29
  "vocab_size": 128256,
30
  "context_window_size": 131072,
31
  "sliding_window_size": -1,
32
- "prefill_chunk_size": 2048,
33
  "attention_sink_size": -1,
34
  "tensor_parallel_shards": 1,
35
  "pipeline_parallel_stages": 1,
 
19
  "rope_type": "llama3"
20
  },
21
  "context_window_size": 131072,
22
+ "prefill_chunk_size": 8192,
23
  "num_key_value_heads": 8,
24
  "head_dim": 128,
25
  "tensor_parallel_shards": 1,
26
  "pipeline_parallel_stages": 1,
27
+ "max_batch_size": 128
28
  },
29
  "vocab_size": 128256,
30
  "context_window_size": 131072,
31
  "sliding_window_size": -1,
32
+ "prefill_chunk_size": 8192,
33
  "attention_sink_size": -1,
34
  "tensor_parallel_shards": 1,
35
  "pipeline_parallel_stages": 1,