saberai committed on
Commit
07f17ae
·
1 Parent(s): 3ac4df8

Update mlc-chat-config.json

Browse files
Files changed (1) hide show
  1. mlc-chat-config.json +17 -39
mlc-chat-config.json CHANGED
@@ -1,41 +1,19 @@
1
  {
2
- "model_type": "gpt_neox",
3
- "quantization": "q4f16_1",
4
- "model_config": {
5
- "use_parallel_residual": false,
6
- "hidden_size": 2560,
7
- "intermediate_size": 10240,
8
- "num_attention_heads": 32,
9
- "num_hidden_layers": 32,
10
- "layer_norm_eps": 1e-05,
11
- "vocab_size": 50432,
12
- "rotary_pct": 1.0,
13
- "position_embedding_base": 10000,
14
- "context_window_size": 2048,
15
- "head_dim": 80,
16
- "prefill_chunk_size": 2048,
17
- "tensor_parallel_shards": 1,
18
- "ffn_out_dtype": "float32"
19
- },
20
- "vocab_size": 50432,
21
- "context_window_size": 2048,
22
- "sliding_window_size": -1,
23
- "prefill_chunk_size": 2048,
24
- "attention_sink_size": -1,
25
- "tensor_parallel_shards": 1,
26
- "mean_gen_len": 128,
27
- "max_gen_len": 512,
28
- "shift_fill_factor": 0.3,
29
- "temperature": 0.7,
30
- "repetition_penalty": 1.0,
31
- "top_p": 0.95,
32
- "conv_template": "redpajama_chat",
33
- "pad_token_id": 0,
34
- "bos_token_id": 0,
35
- "eos_token_id": 0,
36
- "tokenizer_files": [
37
- "tokenizer.json",
38
- "tokenizer_config.json"
39
- ],
40
- "version": "0.1.0"
41
  }
 
1
  {
2
+ "model_lib": "RedPajama-INCITE-Chat-3B-v1-q4f16_1",
3
+ "local_id": "RedPajama-INCITE-Chat-3B-v1-q4f16_1",
4
+ "conv_template": "redpajama_chat",
5
+ "temperature": 0.7,
6
+ "repetition_penalty": 1.01,
7
+ "top_p": 0.95,
8
+ "mean_gen_len": 128,
9
+ "max_gen_len": 512,
10
+ "shift_fill_factor": 0.3,
11
+ "estimated_vram_req": 2254857830,
12
+ "tokenizer_files": [
13
+ "tokenizer.json"
14
+ ],
15
+ "model_category": "gpt_neox",
16
+ "model_name": "RedPajama-INCITE-Chat-3B-v1",
17
+ "max_window_size": 2048,
18
+ "vocab_size": 50432
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  }