BaoHuynh2002 committed on
Commit
cd6568c
1 Parent(s): 6fd593e

Upload MPTForCausalLM

Browse files
Files changed (3) hide show
  1. config.json +73 -0
  2. generation_config.json +5 -0
  3. pytorch_model.bin +3 -0
config.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "vinai/PhoGPT-4B-Chat",
3
+ "architectures": [
4
+ "MPTForCausalLM"
5
+ ],
6
+ "attn_config": {
7
+ "alibi": true,
8
+ "alibi_bias_max": 8,
9
+ "attn_impl": "torch",
10
+ "attn_pdrop": 0.0,
11
+ "attn_type": "multihead_attention",
12
+ "attn_uses_sequence_id": false,
13
+ "clip_qkv": null,
14
+ "prefix_lm": false,
15
+ "qk_gn": false,
16
+ "qk_ln": false,
17
+ "rope": false,
18
+ "rope_dail_config": {
19
+ "pos_idx_in_fp32": true,
20
+ "type": "original",
21
+ "xpos_scale_base": 512
22
+ },
23
+ "rope_hf_config": {
24
+ "factor": 1.0,
25
+ "type": "no_scaling"
26
+ },
27
+ "rope_impl": "dail",
28
+ "rope_theta": 10000,
29
+ "sliding_window_size": -1,
30
+ "softmax_scale": null
31
+ },
32
+ "auto_map": {
33
+ "AutoConfig": "vinai/PhoGPT-4B-Chat--configuration_mpt.MPTConfig",
34
+ "AutoModelForCausalLM": "vinai/PhoGPT-4B-Chat--modeling_mpt.MPTForCausalLM"
35
+ },
36
+ "d_model": 3072,
37
+ "emb_pdrop": 0.0,
38
+ "embedding_fraction": 1.0,
39
+ "expansion_ratio": 4,
40
+ "fc_type": "torch",
41
+ "ffn_config": {
42
+ "fc_type": "torch",
43
+ "ffn_type": "mptmlp"
44
+ },
45
+ "init_config": {
46
+ "emb_init_std": null,
47
+ "emb_init_uniform_lim": null,
48
+ "fan_mode": "fan_in",
49
+ "init_div_is_residual": true,
50
+ "init_gain": 0.0,
51
+ "init_nonlinearity": "relu",
52
+ "init_std": null,
53
+ "name": "kaiming_normal_",
54
+ "verbose": 0
55
+ },
56
+ "init_device": "cpu",
57
+ "learned_pos_emb": false,
58
+ "logit_scale": null,
59
+ "max_seq_len": 8192,
60
+ "model_type": "mpt",
61
+ "n_heads": 24,
62
+ "n_layers": 32,
63
+ "no_bias": false,
64
+ "norm_type": "low_precision_layernorm",
65
+ "pretraining_tp": 1,
66
+ "resid_pdrop": 0.0,
67
+ "torch_dtype": "bfloat16",
68
+ "transformers_version": "4.31.0",
69
+ "use_cache": false,
70
+ "use_pad_tok_in_ffn": true,
71
+ "verbose": 0,
72
+ "vocab_size": 20480
73
+ }
generation_config.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "transformers_version": "4.31.0",
4
+ "use_cache": false
5
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96ed0c77d891d76c33f7b3014f65d7c36d0207432d9596c123d148cb17334421
3
+ size 7376285862