muverqqw committed on
Commit
9f3eb71
·
verified ·
1 Parent(s): 030a406

Step Final_Loss6.35_Tok19.69M

Browse files
config.json CHANGED
@@ -1,10 +1,14 @@
1
  {
 
 
 
2
  "attention_dropout": 0.0,
3
  "auto_map": {
4
  "AutoConfig": "configuration_alinlight.AlinlightConfig",
5
  "AutoModelForCausalLM": "modeling_alinlight.AlinlightForCausalLM"
6
  },
7
  "bos_token_id": 1,
 
8
  "eos_token_id": 2,
9
  "hidden_size": 2048,
10
  "initializer_range": 0.02,
@@ -20,6 +24,6 @@
20
  "rope_theta": 10000.0,
21
  "sliding_window": 4096,
22
  "transformers_version": "4.57.3",
23
- "use_cache": true,
24
  "vocab_size": 128000
25
  }
 
1
  {
2
+ "architectures": [
3
+ "AlinlightForCausalLM"
4
+ ],
5
  "attention_dropout": 0.0,
6
  "auto_map": {
7
  "AutoConfig": "configuration_alinlight.AlinlightConfig",
8
  "AutoModelForCausalLM": "modeling_alinlight.AlinlightForCausalLM"
9
  },
10
  "bos_token_id": 1,
11
+ "dtype": "bfloat16",
12
  "eos_token_id": 2,
13
  "hidden_size": 2048,
14
  "initializer_range": 0.02,
 
24
  "rope_theta": 10000.0,
25
  "sliding_window": 4096,
26
  "transformers_version": "4.57.3",
27
+ "use_cache": false,
28
  "vocab_size": 128000
29
  }
pytorch_model-00001-of-00006.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ab51fd1e1219b0f85c930c88f2b7e748a36cf3b36fa08f6091f6fca5fd466af
3
  size 524289980
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:509c55c9f5afb0bbf941e26423d78618a5934f418098511995df96f964e7c368
3
  size 524289980
pytorch_model-00002-of-00006.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c475cea54fd3d325ec01f5fe3d9d3b52f9caf92e9052b2229668c5812d132a65
3
  size 494988197
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b38721d209392513c4bff257430122fe5b675b7a87d4c87f82babeee3fcd0856
3
  size 494988197
pytorch_model-00003-of-00006.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77b5ed70297d115bd84daa7af1cceee6534b98af1607ec3ea12928e0439eb6d7
3
  size 497093139
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afe49bbba75c82843adab077a3bda5d9d390d26f9d8ff9261adff45327c5bb09
3
  size 497093139
pytorch_model-00004-of-00006.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fd28fd3752d7e4d61cf889ff5d2164a0c761daa9eed8815f4fca4392e88856c
3
  size 494988261
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b94a62e15ef52b6bb327fdd5b32868ac12d8eb817187a90ff49373a4b73e7d5f
3
  size 494988261
pytorch_model-00005-of-00006.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33045b4cf46b467ee042ab1ee1410375b14a09d22dddfa914acc95e988e09668
3
  size 524289916
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a92f5333b7c27923a58fe01a22019ecc33e17bba7c4e8e828a8e36ee17b2dd2f
3
  size 524289916
pytorch_model-00006-of-00006.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c4a7602ae11439b0e62f5e06b3cf1491fd20bab3dbcd09f9ed2372e11de8663
3
  size 497097637
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e298624cdfbe1a06820afda5dc6f897e260b49cddc1507bcb1c431997cc39c00
3
  size 497097637