Training in progress, epoch 1
Browse files- config.json +1 -1
- model-00001-of-00002.safetensors +1 -1
- model-00002-of-00002.safetensors +2 -2
- model.safetensors.index.json +2 -1
- runs/Jan28_13-13-12_ip-172-31-27-247/events.out.tfevents.1738069999.ip-172-31-27-247.32100.0 +3 -0
- runs/Jan28_13-14-16_ip-172-31-27-247/events.out.tfevents.1738070064.ip-172-31-27-247.32540.0 +3 -0
- runs/Jan28_13-15-28_ip-172-31-27-247/events.out.tfevents.1738070135.ip-172-31-27-247.32910.0 +3 -0
- runs/Jan28_13-16-03_ip-172-31-27-247/events.out.tfevents.1738070170.ip-172-31-27-247.33225.0 +3 -0
- runs/Jan28_13-16-54_ip-172-31-27-247/events.out.tfevents.1738070221.ip-172-31-27-247.33551.0 +3 -0
- runs/Jan28_13-17-31_ip-172-31-27-247/events.out.tfevents.1738070258.ip-172-31-27-247.33880.0 +3 -0
- runs/Jan28_13-18-09_ip-172-31-27-247/events.out.tfevents.1738070296.ip-172-31-27-247.34205.0 +3 -0
- runs/Jan28_13-21-58_ip-172-31-27-247/events.out.tfevents.1738070528.ip-172-31-27-247.34674.0 +3 -0
- runs/Jan28_13-23-08_ip-172-31-27-247/events.out.tfevents.1738070598.ip-172-31-27-247.35102.0 +3 -0
- runs/Jan28_13-24-21_ip-172-31-27-247/events.out.tfevents.1738070671.ip-172-31-27-247.35631.0 +3 -0
- runs/Jan28_13-29-15_ip-172-31-27-247/events.out.tfevents.1738070965.ip-172-31-27-247.36065.0 +3 -0
- runs/Jan29_02-12-46_ip-172-31-27-247/events.out.tfevents.1738116777.ip-172-31-27-247.38694.0 +3 -0
- runs/Jan29_02-13-56_ip-172-31-27-247/events.out.tfevents.1738116846.ip-172-31-27-247.39125.0 +3 -0
- runs/Jan29_02-14-33_ip-172-31-27-247/events.out.tfevents.1738116884.ip-172-31-27-247.39550.0 +3 -0
- runs/Jan29_02-15-14_ip-172-31-27-247/events.out.tfevents.1738116924.ip-172-31-27-247.39975.0 +3 -0
- runs/Jan29_02-17-30_ip-172-31-27-247/events.out.tfevents.1738117064.ip-172-31-27-247.40457.0 +3 -0
- training_args.bin +2 -2
config.json
CHANGED
@@ -31,6 +31,6 @@
|
|
31 |
"tie_word_embeddings": true,
|
32 |
"torch_dtype": "bfloat16",
|
33 |
"transformers_version": "4.46.3",
|
34 |
-
"use_cache":
|
35 |
"vocab_size": 128256
|
36 |
}
|
|
|
31 |
"tie_word_embeddings": true,
|
32 |
"torch_dtype": "bfloat16",
|
33 |
"transformers_version": "4.46.3",
|
34 |
+
"use_cache": false,
|
35 |
"vocab_size": 128256
|
36 |
}
|
model-00001-of-00002.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4965799096
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1beab377e4ee892b6e614e72bd6aafa63770b1cdee9e37f47b389fe7a2d50cce
|
3 |
size 4965799096
|
model-00002-of-00002.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8059981fa1d26b15573abce1274ff618545c8ae3e916bea80e995ab74f55f903
|
3 |
+
size 2247734992
|
model.safetensors.index.json
CHANGED
@@ -1,8 +1,9 @@
|
|
1 |
{
|
2 |
"metadata": {
|
3 |
-
"total_size":
|
4 |
},
|
5 |
"weight_map": {
|
|
|
6 |
"model.embed_tokens.weight": "model-00001-of-00002.safetensors",
|
7 |
"model.layers.0.input_layernorm.weight": "model-00001-of-00002.safetensors",
|
8 |
"model.layers.0.mlp.down_proj.weight": "model-00001-of-00002.safetensors",
|
|
|
1 |
{
|
2 |
"metadata": {
|
3 |
+
"total_size": 7213504512
|
4 |
},
|
5 |
"weight_map": {
|
6 |
+
"lm_head.weight": "model-00002-of-00002.safetensors",
|
7 |
"model.embed_tokens.weight": "model-00001-of-00002.safetensors",
|
8 |
"model.layers.0.input_layernorm.weight": "model-00001-of-00002.safetensors",
|
9 |
"model.layers.0.mlp.down_proj.weight": "model-00001-of-00002.safetensors",
|
runs/Jan28_13-13-12_ip-172-31-27-247/events.out.tfevents.1738069999.ip-172-31-27-247.32100.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a301fac4786a5c28ed806d45d05299ce83569953a5cfd9853e5a2d5048b7144
|
3 |
+
size 5875
|
runs/Jan28_13-14-16_ip-172-31-27-247/events.out.tfevents.1738070064.ip-172-31-27-247.32540.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30a95964b01186216a41b78ac6aa1e4f0131c613725dd4f4d8c0da0e962a785f
|
3 |
+
size 5667
|
runs/Jan28_13-15-28_ip-172-31-27-247/events.out.tfevents.1738070135.ip-172-31-27-247.32910.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc188043c246e4041ddc018873bab92273a433f60b35e777d56f273704b58624
|
3 |
+
size 5665
|
runs/Jan28_13-16-03_ip-172-31-27-247/events.out.tfevents.1738070170.ip-172-31-27-247.33225.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bf28b6872c8f211e64350015d3940dc13426b7e0153f86d44f5cf824654a343
|
3 |
+
size 5665
|
runs/Jan28_13-16-54_ip-172-31-27-247/events.out.tfevents.1738070221.ip-172-31-27-247.33551.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2aa8592d9d2ede51db89e6db3ef18e92f1797a907fb570bc44689c574dca6b03
|
3 |
+
size 5665
|
runs/Jan28_13-17-31_ip-172-31-27-247/events.out.tfevents.1738070258.ip-172-31-27-247.33880.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2be4dd6c0a8e94e6f3b606b5aa56120679eec9c971c7635aeaed7c4cef20c36
|
3 |
+
size 5665
|
runs/Jan28_13-18-09_ip-172-31-27-247/events.out.tfevents.1738070296.ip-172-31-27-247.34205.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:315a1e3543c3a20aaeb8565b1795d47ac5584403b2dce336a8e9fd5847f0691f
|
3 |
+
size 5665
|
runs/Jan28_13-21-58_ip-172-31-27-247/events.out.tfevents.1738070528.ip-172-31-27-247.34674.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec923c92a03f56cf3719e9a615febac933a973df083334eca46a586ebc2134ad
|
3 |
+
size 5665
|
runs/Jan28_13-23-08_ip-172-31-27-247/events.out.tfevents.1738070598.ip-172-31-27-247.35102.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0efb8a05d4020eeddb13d76ba95f611d80658506d0204d171939a40fdc9f8944
|
3 |
+
size 5876
|
runs/Jan28_13-24-21_ip-172-31-27-247/events.out.tfevents.1738070671.ip-172-31-27-247.35631.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:954a6049e60bfd3c7af90055362eadeaf3f712b958d31cd28e73548dba18465d
|
3 |
+
size 5663
|
runs/Jan28_13-29-15_ip-172-31-27-247/events.out.tfevents.1738070965.ip-172-31-27-247.36065.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bead1a3cfb0074a9ea11e945f32cd7f69809292f8629c7b09beb24ea99e5ade3
|
3 |
+
size 125412
|
runs/Jan29_02-12-46_ip-172-31-27-247/events.out.tfevents.1738116777.ip-172-31-27-247.38694.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d462bb712b1c910b2a76da4b5e729f7245ab0e2ce07daafc92f90e256b6f774d
|
3 |
+
size 5662
|
runs/Jan29_02-13-56_ip-172-31-27-247/events.out.tfevents.1738116846.ip-172-31-27-247.39125.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f1c8109e1fa8790e42f3545a0b844c8c5b7ba3a5edba77facbfbe060c007222
|
3 |
+
size 5664
|
runs/Jan29_02-14-33_ip-172-31-27-247/events.out.tfevents.1738116884.ip-172-31-27-247.39550.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a46e558d0d05462dde5144aa224c13b820ed7183ef254001d2265c599a797c6f
|
3 |
+
size 5663
|
runs/Jan29_02-15-14_ip-172-31-27-247/events.out.tfevents.1738116924.ip-172-31-27-247.39975.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8b9830a61b467cd23a151e456dc8f63072df096e3adde92d519289ef1d9e56b
|
3 |
+
size 5662
|
runs/Jan29_02-17-30_ip-172-31-27-247/events.out.tfevents.1738117064.ip-172-31-27-247.40457.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fe66f214690274f5c7edc844ad7cbc94e2b989925eba76ceb54395dc49c6a17
|
3 |
+
size 471237
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4fdf4fd260cf9e8fbf76f39401fc46927fd57a8e9c182403767a89396e3cac0
|
3 |
+
size 6904
|