Text Generation
Transformers
Safetensors
Finnish
llama
finnish
conversational
text-generation-inference
aapot committed on
Commit
ce7ff6d
1 Parent(s): 9ced1e8

Add 2-stage 1060k step model

Browse files
config.json CHANGED
@@ -11,6 +11,7 @@
11
  "initializer_range": 0.02,
12
  "intermediate_size": 8640,
13
  "max_position_embeddings": 2048,
 
14
  "model_type": "llama",
15
  "num_attention_heads": 32,
16
  "num_hidden_layers": 26,
@@ -21,7 +22,7 @@
21
  "rope_theta": 10000.0,
22
  "tie_word_embeddings": false,
23
  "torch_dtype": "float16",
24
- "transformers_version": "4.38.0.dev0",
25
  "use_cache": true,
26
  "vocab_size": 64256
27
  }
 
11
  "initializer_range": 0.02,
12
  "intermediate_size": 8640,
13
  "max_position_embeddings": 2048,
14
+ "mlp_bias": false,
15
  "model_type": "llama",
16
  "num_attention_heads": 32,
17
  "num_hidden_layers": 26,
 
22
  "rope_theta": 10000.0,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "float16",
25
+ "transformers_version": "4.42.0.dev0",
26
  "use_cache": true,
27
  "vocab_size": 64256
28
  }
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
- "transformers_version": "4.38.0.dev0"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
+ "transformers_version": "4.42.0.dev0"
6
  }
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:944f734c9d4facd84eb7b415f59bbd9c5463ccdf685b246fc08855c8cb5870b0
3
  size 4953951976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebea50b3d4ba830085a26f5a608edeaf36f78c3bc5b5c81c83ebec436576116c
3
  size 4953951976
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8115805319bd7f4bfc318984ab8651e8a5f1120a5548de36bb6244069d74eb2e
3
  size 2311899224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0296bfe931223bd0ecb717a60bb9aea6ac40ab6c7e960f0a897eb9e8e2550c8b
3
  size 2311899224