explcre commited on
Commit
90dde69
·
verified ·
1 Parent(s): 3010e95

Upload exp_phase8_bridge_recipeABC_KDmatrix_205425/log.jsonl with huggingface_hub

Browse files
exp_phase8_bridge_recipeABC_KDmatrix_205425/log.jsonl ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {"step": 0, "loss": 1.4807003736495972, "loss_mdlm": 1.2960470914840698, "loss_lm": 1.8465330600738525, "loss_ct": 0.0, "lr": 0.0, "gnorm": 0.7072781324386597, "bridge_gate_avg": 1.0, "bridge_out_proj_avg": 0.0, "elapsed_s": 3.3111066818237305}
2
+ {"step": 100, "loss": 1.4608423709869385, "loss_mdlm": 1.3450387716293335, "loss_lm": 1.1580358743667603, "loss_ct": 0.0, "lr": 2.5e-05, "gnorm": 0.8035140037536621, "bridge_gate_avg": 1.0007514953613281, "bridge_out_proj_avg": 0.0003448505958658643, "elapsed_s": 39.40489959716797}
3
+ {"step": 200, "loss": 1.4772427082061768, "loss_mdlm": 1.3282194137573242, "loss_lm": 1.490233063697815, "loss_ct": 0.0, "lr": 5e-05, "gnorm": 0.8526065349578857, "bridge_gate_avg": 1.003314197063446, "bridge_out_proj_avg": 0.0015859982231631875, "elapsed_s": 72.99261283874512}
4
+ {"step": 300, "loss": 1.3764095306396484, "loss_mdlm": 1.3097258806228638, "loss_lm": 0.6668360829353333, "loss_ct": 0.0, "lr": 4.962019382530521e-05, "gnorm": 0.5771306157112122, "bridge_gate_avg": 1.0041352212429047, "bridge_out_proj_avg": 0.0018417016544844955, "elapsed_s": 105.98136472702026}
5
+ {"step": 400, "loss": 1.4581562280654907, "loss_mdlm": 1.3705295324325562, "loss_lm": 0.8762664794921875, "loss_ct": 0.0, "lr": 4.849231551964771e-05, "gnorm": 0.637607216835022, "bridge_gate_avg": 1.0048262476921082, "bridge_out_proj_avg": 0.0019542877562344074, "elapsed_s": 139.34164690971375}
6
+ {"step": 500, "loss": 1.4199573993682861, "loss_mdlm": 1.340954065322876, "loss_lm": 0.7900329828262329, "loss_ct": 0.0, "lr": 4.665063509461097e-05, "gnorm": 0.6488635540008545, "bridge_gate_avg": 1.0060576498508453, "bridge_out_proj_avg": 0.002071397437248379, "elapsed_s": 171.13466668128967}
7
+ {"step": 600, "loss": 1.4259397983551025, "loss_mdlm": 1.355509877204895, "loss_lm": 0.7042996287345886, "loss_ct": 0.0, "lr": 4.415111107797445e-05, "gnorm": 0.47471004724502563, "bridge_gate_avg": 1.0071673691272736, "bridge_out_proj_avg": 0.002137564937584102, "elapsed_s": 202.75241422653198}
8
+ {"step": 700, "loss": 1.3947677612304688, "loss_mdlm": 1.3226498365402222, "loss_lm": 0.7211797833442688, "loss_ct": 0.0, "lr": 4.1069690242163484e-05, "gnorm": 0.5088882446289062, "bridge_gate_avg": 1.0083767473697662, "bridge_out_proj_avg": 0.0022153593017719686, "elapsed_s": 234.74259281158447}
9
+ {"step": 800, "loss": 1.4010770320892334, "loss_mdlm": 1.2996689081192017, "loss_lm": 1.0140811204910278, "loss_ct": 0.0, "lr": 3.7500000000000003e-05, "gnorm": 0.6771104335784912, "bridge_gate_avg": 1.0091662406921387, "bridge_out_proj_avg": 0.002285940747242421, "elapsed_s": 266.46807384490967}