Text Generation
Transformers
PyTorch
Japanese
open-llama
Inference Endpoints
tahomatx committed on
Commit
13f2a3e
1 Parent(s): 18cb820

Upload OpenLlamaForCausalLM (#4)

Browse files

- Upload OpenLlamaForCausalLM (650775b9e7d473b08c6f150ed58aa22d00918f5e)

Files changed (2)
  1. config.json +3 -3
  2. pytorch_model.bin +2 -2
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "_name_or_path": "/mnt/n/ml/models/aerner/lm-v2/checkpoint-76000",
3
  "architectures": [
4
- "LlamaForCausalLM"
5
  ],
6
  "attention_dropout_prob": 0.1,
7
  "bos_token_id": 1,
@@ -12,7 +12,7 @@
12
  "initializer_range": 0.02,
13
  "intermediate_size": 11008,
14
  "max_position_embeddings": 2048,
15
- "model_type": "llama",
16
  "num_attention_heads": 32,
17
  "num_hidden_layers": 8,
18
  "pad_token_id": 0,
 
1
  {
2
+ "_name_or_path": "/mnt/n/ml/models/aerner/lm-v2/checkpoint-76200",
3
  "architectures": [
4
+ "OpenLlamaForCausalLM"
5
  ],
6
  "attention_dropout_prob": 0.1,
7
  "bos_token_id": 1,
 
12
  "initializer_range": 0.02,
13
  "intermediate_size": 11008,
14
  "max_position_embeddings": 2048,
15
+ "model_type": "open-llama",
16
  "num_attention_heads": 32,
17
  "num_hidden_layers": 8,
18
  "pad_token_id": 0,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9af5ea94b7d6af2b5c99464086434f26ae3a681d767bd29674ded3b51f22336a
3
- size 2169864106
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8c5dd165b8fc67f0aac39e7162adde3a7aae9c039b5a2d92100dfb2fd91d90d
3
+ size 1760272621