hhschu committed on
Commit
01504e9
·
verified ·
1 Parent(s): b70b201

Training in progress, epoch 1

Browse files
Files changed (21) hide show
  1. config.json +1 -1
  2. model-00001-of-00002.safetensors +1 -1
  3. model-00002-of-00002.safetensors +2 -2
  4. model.safetensors.index.json +2 -1
  5. runs/Jan28_13-13-12_ip-172-31-27-247/events.out.tfevents.1738069999.ip-172-31-27-247.32100.0 +3 -0
  6. runs/Jan28_13-14-16_ip-172-31-27-247/events.out.tfevents.1738070064.ip-172-31-27-247.32540.0 +3 -0
  7. runs/Jan28_13-15-28_ip-172-31-27-247/events.out.tfevents.1738070135.ip-172-31-27-247.32910.0 +3 -0
  8. runs/Jan28_13-16-03_ip-172-31-27-247/events.out.tfevents.1738070170.ip-172-31-27-247.33225.0 +3 -0
  9. runs/Jan28_13-16-54_ip-172-31-27-247/events.out.tfevents.1738070221.ip-172-31-27-247.33551.0 +3 -0
  10. runs/Jan28_13-17-31_ip-172-31-27-247/events.out.tfevents.1738070258.ip-172-31-27-247.33880.0 +3 -0
  11. runs/Jan28_13-18-09_ip-172-31-27-247/events.out.tfevents.1738070296.ip-172-31-27-247.34205.0 +3 -0
  12. runs/Jan28_13-21-58_ip-172-31-27-247/events.out.tfevents.1738070528.ip-172-31-27-247.34674.0 +3 -0
  13. runs/Jan28_13-23-08_ip-172-31-27-247/events.out.tfevents.1738070598.ip-172-31-27-247.35102.0 +3 -0
  14. runs/Jan28_13-24-21_ip-172-31-27-247/events.out.tfevents.1738070671.ip-172-31-27-247.35631.0 +3 -0
  15. runs/Jan28_13-29-15_ip-172-31-27-247/events.out.tfevents.1738070965.ip-172-31-27-247.36065.0 +3 -0
  16. runs/Jan29_02-12-46_ip-172-31-27-247/events.out.tfevents.1738116777.ip-172-31-27-247.38694.0 +3 -0
  17. runs/Jan29_02-13-56_ip-172-31-27-247/events.out.tfevents.1738116846.ip-172-31-27-247.39125.0 +3 -0
  18. runs/Jan29_02-14-33_ip-172-31-27-247/events.out.tfevents.1738116884.ip-172-31-27-247.39550.0 +3 -0
  19. runs/Jan29_02-15-14_ip-172-31-27-247/events.out.tfevents.1738116924.ip-172-31-27-247.39975.0 +3 -0
  20. runs/Jan29_02-17-30_ip-172-31-27-247/events.out.tfevents.1738117064.ip-172-31-27-247.40457.0 +3 -0
  21. training_args.bin +2 -2
config.json CHANGED
@@ -31,6 +31,6 @@
31
  "tie_word_embeddings": true,
32
  "torch_dtype": "bfloat16",
33
  "transformers_version": "4.46.3",
34
- "use_cache": true,
35
  "vocab_size": 128256
36
  }
 
31
  "tie_word_embeddings": true,
32
  "torch_dtype": "bfloat16",
33
  "transformers_version": "4.46.3",
34
+ "use_cache": false,
35
  "vocab_size": 128256
36
  }
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5659e7d37679476756dcbd94baf11699206dd32a519f063d7e07d00f2d1f487a
3
  size 4965799096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1beab377e4ee892b6e614e72bd6aafa63770b1cdee9e37f47b389fe7a2d50cce
3
  size 4965799096
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea99f35bf1c02c001583e1fb393aca728734569e8b3a2b4ccfdd09a80b10db01
3
- size 1459729952
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8059981fa1d26b15573abce1274ff618545c8ae3e916bea80e995ab74f55f903
3
+ size 2247734992
model.safetensors.index.json CHANGED
@@ -1,8 +1,9 @@
1
  {
2
  "metadata": {
3
- "total_size": 6425499648
4
  },
5
  "weight_map": {
 
6
  "model.embed_tokens.weight": "model-00001-of-00002.safetensors",
7
  "model.layers.0.input_layernorm.weight": "model-00001-of-00002.safetensors",
8
  "model.layers.0.mlp.down_proj.weight": "model-00001-of-00002.safetensors",
 
1
  {
2
  "metadata": {
3
+ "total_size": 7213504512
4
  },
5
  "weight_map": {
6
+ "lm_head.weight": "model-00002-of-00002.safetensors",
7
  "model.embed_tokens.weight": "model-00001-of-00002.safetensors",
8
  "model.layers.0.input_layernorm.weight": "model-00001-of-00002.safetensors",
9
  "model.layers.0.mlp.down_proj.weight": "model-00001-of-00002.safetensors",
runs/Jan28_13-13-12_ip-172-31-27-247/events.out.tfevents.1738069999.ip-172-31-27-247.32100.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a301fac4786a5c28ed806d45d05299ce83569953a5cfd9853e5a2d5048b7144
3
+ size 5875
runs/Jan28_13-14-16_ip-172-31-27-247/events.out.tfevents.1738070064.ip-172-31-27-247.32540.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30a95964b01186216a41b78ac6aa1e4f0131c613725dd4f4d8c0da0e962a785f
3
+ size 5667
runs/Jan28_13-15-28_ip-172-31-27-247/events.out.tfevents.1738070135.ip-172-31-27-247.32910.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc188043c246e4041ddc018873bab92273a433f60b35e777d56f273704b58624
3
+ size 5665
runs/Jan28_13-16-03_ip-172-31-27-247/events.out.tfevents.1738070170.ip-172-31-27-247.33225.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bf28b6872c8f211e64350015d3940dc13426b7e0153f86d44f5cf824654a343
3
+ size 5665
runs/Jan28_13-16-54_ip-172-31-27-247/events.out.tfevents.1738070221.ip-172-31-27-247.33551.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aa8592d9d2ede51db89e6db3ef18e92f1797a907fb570bc44689c574dca6b03
3
+ size 5665
runs/Jan28_13-17-31_ip-172-31-27-247/events.out.tfevents.1738070258.ip-172-31-27-247.33880.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2be4dd6c0a8e94e6f3b606b5aa56120679eec9c971c7635aeaed7c4cef20c36
3
+ size 5665
runs/Jan28_13-18-09_ip-172-31-27-247/events.out.tfevents.1738070296.ip-172-31-27-247.34205.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:315a1e3543c3a20aaeb8565b1795d47ac5584403b2dce336a8e9fd5847f0691f
3
+ size 5665
runs/Jan28_13-21-58_ip-172-31-27-247/events.out.tfevents.1738070528.ip-172-31-27-247.34674.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec923c92a03f56cf3719e9a615febac933a973df083334eca46a586ebc2134ad
3
+ size 5665
runs/Jan28_13-23-08_ip-172-31-27-247/events.out.tfevents.1738070598.ip-172-31-27-247.35102.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0efb8a05d4020eeddb13d76ba95f611d80658506d0204d171939a40fdc9f8944
3
+ size 5876
runs/Jan28_13-24-21_ip-172-31-27-247/events.out.tfevents.1738070671.ip-172-31-27-247.35631.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:954a6049e60bfd3c7af90055362eadeaf3f712b958d31cd28e73548dba18465d
3
+ size 5663
runs/Jan28_13-29-15_ip-172-31-27-247/events.out.tfevents.1738070965.ip-172-31-27-247.36065.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bead1a3cfb0074a9ea11e945f32cd7f69809292f8629c7b09beb24ea99e5ade3
3
+ size 125412
runs/Jan29_02-12-46_ip-172-31-27-247/events.out.tfevents.1738116777.ip-172-31-27-247.38694.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d462bb712b1c910b2a76da4b5e729f7245ab0e2ce07daafc92f90e256b6f774d
3
+ size 5662
runs/Jan29_02-13-56_ip-172-31-27-247/events.out.tfevents.1738116846.ip-172-31-27-247.39125.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f1c8109e1fa8790e42f3545a0b844c8c5b7ba3a5edba77facbfbe060c007222
3
+ size 5664
runs/Jan29_02-14-33_ip-172-31-27-247/events.out.tfevents.1738116884.ip-172-31-27-247.39550.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a46e558d0d05462dde5144aa224c13b820ed7183ef254001d2265c599a797c6f
3
+ size 5663
runs/Jan29_02-15-14_ip-172-31-27-247/events.out.tfevents.1738116924.ip-172-31-27-247.39975.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8b9830a61b467cd23a151e456dc8f63072df096e3adde92d519289ef1d9e56b
3
+ size 5662
runs/Jan29_02-17-30_ip-172-31-27-247/events.out.tfevents.1738117064.ip-172-31-27-247.40457.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fe66f214690274f5c7edc844ad7cbc94e2b989925eba76ceb54395dc49c6a17
3
+ size 471237
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4cfbd9c6a6058f26f66ebda9f9629ca23eff1fc99d4d1c06c9e0cad1b3e34298
3
- size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4fdf4fd260cf9e8fbf76f39401fc46927fd57a8e9c182403767a89396e3cac0
3
+ size 6904