aapot committed on
Commit
025a638
1 Parent(s): c8a9735

Add 750k step model

Browse files
Files changed (3) hide show
  1. config.json +4 -1
  2. generation_config.json +1 -1
  3. pytorch_model.bin +1 -1
config.json CHANGED
@@ -12,11 +12,14 @@
12
  "model_type": "llama",
13
  "num_attention_heads": 32,
14
  "num_hidden_layers": 26,
 
15
  "pad_token_id": 0,
 
16
  "rms_norm_eps": 1e-06,
 
17
  "tie_word_embeddings": false,
18
  "torch_dtype": "float16",
19
- "transformers_version": "4.31.0.dev0",
20
  "use_cache": true,
21
  "vocab_size": 64256
22
  }
 
12
  "model_type": "llama",
13
  "num_attention_heads": 32,
14
  "num_hidden_layers": 26,
15
+ "num_key_value_heads": 32,
16
  "pad_token_id": 0,
17
+ "pretraining_tp": 1,
18
  "rms_norm_eps": 1e-06,
19
+ "rope_scaling": null,
20
  "tie_word_embeddings": false,
21
  "torch_dtype": "float16",
22
+ "transformers_version": "4.32.0.dev0",
23
  "use_cache": true,
24
  "vocab_size": 64256
25
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.31.0.dev0"
7
  }
 
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.32.0.dev0"
7
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2185d8ab92e60d219c064f5e75e81d9ed0cf560c22654553cbb64b746fb72db3
3
  size 7265915001
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1854b80d81867d3b5bb0f5c251f87139f0fc4a0331099255dddcd470de936391
3
  size 7265915001