sjrhuschlee committed on
Commit
ef67aae
1 Parent(s): e37bbbc

Delete merged_model/config.json

Files changed (1)
  1. merged_model/config.json +0 -32
merged_model/config.json DELETED
@@ -1,32 +0,0 @@
- {
-   "_name_or_path": "google/flan-t5-large",
-   "architectures": [
-     "T5ForQuestionAnswering"
-   ],
-   "d_ff": 2816,
-   "d_kv": 64,
-   "d_model": 1024,
-   "decoder_start_token_id": 0,
-   "dense_act_fn": "gelu_new",
-   "dropout_rate": 0.1,
-   "eos_token_id": 1,
-   "feed_forward_proj": "gated-gelu",
-   "initializer_factor": 1.0,
-   "is_encoder_decoder": true,
-   "is_gated_act": true,
-   "layer_norm_epsilon": 1e-06,
-   "model_type": "t5",
-   "n_positions": 512,
-   "num_decoder_layers": 24,
-   "num_heads": 16,
-   "num_layers": 24,
-   "output_past": true,
-   "pad_token_id": 0,
-   "relative_attention_max_distance": 128,
-   "relative_attention_num_buckets": 32,
-   "tie_word_embeddings": false,
-   "torch_dtype": "float32",
-   "transformers_version": "4.31.0.dev0",
-   "use_cache": true,
-   "vocab_size": 32128
- }