daze-unlv commited on
Commit
7f8f047
1 Parent(s): e5d2054

Training in progress, epoch 10

Browse files
log.txt CHANGED
@@ -116,3 +116,17 @@
116
  {'loss': 0.185, 'grad_norm': 16.464384078979492, 'learning_rate': 2.083187492707969e-05, 'epoch': 8.75}
117
  {'loss': 0.1794, 'grad_norm': 20.86390495300293, 'learning_rate': 2.0540193676350487e-05, 'epoch': 8.84}
118
  {'loss': 0.1843, 'grad_norm': 14.848393440246582, 'learning_rate': 2.0248512425621283e-05, 'epoch': 8.93}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
116
  {'loss': 0.185, 'grad_norm': 16.464384078979492, 'learning_rate': 2.083187492707969e-05, 'epoch': 8.75}
117
  {'loss': 0.1794, 'grad_norm': 20.86390495300293, 'learning_rate': 2.0540193676350487e-05, 'epoch': 8.84}
118
  {'loss': 0.1843, 'grad_norm': 14.848393440246582, 'learning_rate': 2.0248512425621283e-05, 'epoch': 8.93}
119
+ [1 2 2 ... 0 2 0] [0 0 2 ... 0 1 0]
120
+ {'eval_loss': 3.4013631343841553, 'eval_accuracy': 0.4159693999521874, 'eval_runtime': 6.5155, 'eval_samples_per_second': 642.004, 'eval_steps_per_second': 20.106, 'epoch': 9.0}
121
+ {'loss': 0.1752, 'grad_norm': 16.65215301513672, 'learning_rate': 1.995683117489208e-05, 'epoch': 9.01}
122
+ {'loss': 0.1354, 'grad_norm': 30.883514404296875, 'learning_rate': 1.9665149924162876e-05, 'epoch': 9.1}
123
+ {'loss': 0.1378, 'grad_norm': 24.399015426635742, 'learning_rate': 1.9373468673433673e-05, 'epoch': 9.19}
124
+ {'loss': 0.1382, 'grad_norm': 10.105205535888672, 'learning_rate': 1.908178742270447e-05, 'epoch': 9.28}
125
+ {'loss': 0.1364, 'grad_norm': 17.550519943237305, 'learning_rate': 1.8790106171975266e-05, 'epoch': 9.36}
126
+ {'loss': 0.1429, 'grad_norm': 14.63619613647461, 'learning_rate': 1.8498424921246062e-05, 'epoch': 9.45}
127
+ {'loss': 0.1484, 'grad_norm': 20.125774383544922, 'learning_rate': 1.820674367051686e-05, 'epoch': 9.54}
128
+ {'loss': 0.1447, 'grad_norm': 9.442309379577637, 'learning_rate': 1.7915062419787655e-05, 'epoch': 9.63}
129
+ {'loss': 0.1441, 'grad_norm': 3.3339831829071045, 'learning_rate': 1.7623381169058455e-05, 'epoch': 9.71}
130
+ {'loss': 0.1422, 'grad_norm': 12.243080139160156, 'learning_rate': 1.733169991832925e-05, 'epoch': 9.8}
131
+ {'loss': 0.1515, 'grad_norm': 8.44780158996582, 'learning_rate': 1.7040018667600048e-05, 'epoch': 9.89}
132
+ {'loss': 0.1478, 'grad_norm': 7.068332672119141, 'learning_rate': 1.6748337416870844e-05, 'epoch': 9.98}
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3dcee5d29c3c6cec18051dcfaf82426afc937dc4cdad0f9b2adfdc7fb21cf305
3
  size 267829484
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac30861de0c27028361f5da5d9a0bd97c4cab21faff9986509bda049d847e6ed
3
  size 267829484
runs/Mar14_16-58-52_cehsc-app-001.ad.unlv.edu/events.out.tfevents.1710460734.cehsc-app-001.ad.unlv.edu.4089564.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:740aaa121039875d7f10e7b71a065104da5764aa826854864c3548628c554048
3
- size 29318
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4d163f603a4a4c14b2029c8b0493aca597b4cf8b89ac9aa411ec6ee1656120f
3
+ size 32227