sedrickkeh commited on
Commit
8180e09
·
verified ·
1 Parent(s): 78eb4d4

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef1db9e9c5585d5670e2cd7467b49f085ec03de20b8aa4c42a47a620361b8981
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bafc57fcaa812d63cc1e3c128e986d0c3ff8659a168d20769bdb06af7ec9ecf0
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b98f8c900e3c683c7b0388eb622b68cbcda48a6fac71efcc2d55ba7ad4e34f8
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30c4873be68ffc42d232a9939b1804d465585089803fcd8c878843ea0a674b5b
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4101a5f257639f3d2f6af33eff7186d2686233153bea06996fc727ee87b325b
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ce62bbcb44cac955a29e1f654a6a28877d3c539b31349933a7e7313126125cb
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:958c82a09952ffb442237febc205399cd4d843c8571b5ff7c10733576d775a10
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67bec0fe378744916e9791f8b17f5743519b45aaad4cfc787eda4fe433ebaf37
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -8,3 +8,9 @@
8
  {"current_steps": 70, "total_steps": 123, "loss": 0.7662, "lr": 5e-06, "epoch": 1.6816816816816815, "percentage": 56.91, "elapsed_time": "0:38:48", "remaining_time": "0:29:23"}
9
  {"current_steps": 80, "total_steps": 123, "loss": 0.7594, "lr": 5e-06, "epoch": 1.921921921921922, "percentage": 65.04, "elapsed_time": "0:44:04", "remaining_time": "0:23:41"}
10
  {"current_steps": 83, "total_steps": 123, "eval_loss": 0.777886688709259, "epoch": 1.993993993993994, "percentage": 67.48, "elapsed_time": "0:46:10", "remaining_time": "0:22:15"}
 
 
 
 
 
 
 
8
  {"current_steps": 70, "total_steps": 123, "loss": 0.7662, "lr": 5e-06, "epoch": 1.6816816816816815, "percentage": 56.91, "elapsed_time": "0:38:48", "remaining_time": "0:29:23"}
9
  {"current_steps": 80, "total_steps": 123, "loss": 0.7594, "lr": 5e-06, "epoch": 1.921921921921922, "percentage": 65.04, "elapsed_time": "0:44:04", "remaining_time": "0:23:41"}
10
  {"current_steps": 83, "total_steps": 123, "eval_loss": 0.777886688709259, "epoch": 1.993993993993994, "percentage": 67.48, "elapsed_time": "0:46:10", "remaining_time": "0:22:15"}
11
+ {"current_steps": 90, "total_steps": 123, "loss": 0.755, "lr": 5e-06, "epoch": 2.1621621621621623, "percentage": 73.17, "elapsed_time": "0:51:02", "remaining_time": "0:18:42"}
12
+ {"current_steps": 100, "total_steps": 123, "loss": 0.7095, "lr": 5e-06, "epoch": 2.4024024024024024, "percentage": 81.3, "elapsed_time": "0:56:18", "remaining_time": "0:12:57"}
13
+ {"current_steps": 110, "total_steps": 123, "loss": 0.7074, "lr": 5e-06, "epoch": 2.6426426426426426, "percentage": 89.43, "elapsed_time": "1:01:33", "remaining_time": "0:07:16"}
14
+ {"current_steps": 120, "total_steps": 123, "loss": 0.7082, "lr": 5e-06, "epoch": 2.8828828828828827, "percentage": 97.56, "elapsed_time": "1:06:51", "remaining_time": "0:01:40"}
15
+ {"current_steps": 123, "total_steps": 123, "eval_loss": 0.7722160816192627, "epoch": 2.954954954954955, "percentage": 100.0, "elapsed_time": "1:10:13", "remaining_time": "0:00:00"}
16
+ {"current_steps": 123, "total_steps": 123, "epoch": 2.954954954954955, "percentage": 100.0, "elapsed_time": "1:11:26", "remaining_time": "0:00:00"}