mnoukhov committed on
Commit
4c682ba
1 Parent(s): 651c753

Training in progress, step 500

Browse files
Files changed (4) hide show
  1. config.json +2 -1
  2. model.safetensors +1 -1
  3. tokenizer.json +0 -0
  4. training_args.bin +2 -2
config.json CHANGED
@@ -7,6 +7,7 @@
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 1,
9
  "eos_token_id": 2,
 
10
  "hidden_act": "silu",
11
  "hidden_size": 576,
12
  "initializer_range": 0.041666666666666664,
@@ -32,7 +33,7 @@
32
  "q4f16": "float16"
33
  }
34
  },
35
- "transformers_version": "4.37.2",
36
  "use_cache": true,
37
  "vocab_size": 49152
38
  }
 
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 1,
9
  "eos_token_id": 2,
10
+ "head_dim": 64,
11
  "hidden_act": "silu",
12
  "hidden_size": 576,
13
  "initializer_range": 0.041666666666666664,
 
33
  "q4f16": "float16"
34
  }
35
  },
36
+ "transformers_version": "4.46.2",
37
  "use_cache": true,
38
  "vocab_size": 49152
39
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3743619989cdc9de8de17473276e1fc25b6dd172faab798e9931f4b96aee761
3
  size 538090408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32bbe7ad0654dc7683a73bf6f8915862ccfc1eec9d95cb89a4e3b9212b765709
3
  size 538090408
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa82d7a9095ed13ceeb90bf43e8ab0f46ef1f02469ca3c75f77f1cce2c407f5e
3
- size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91a73bf304a4f4427be6627ca979e2c8c81a81c93d8121ccb55f95ba188acb62
3
+ size 5880