explcre commited on
Commit
0480da9
·
verified ·
1 Parent(s): b747e86

Upload exp_phase8_bridge_recipeAB_300step_035043/log.jsonl with huggingface_hub

Browse files
exp_phase8_bridge_recipeAB_300step_035043/log.jsonl ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"step": 0, "loss": 2.193673610687256, "loss_mdlm": 1.2750681638717651, "loss_lm": 1.8372111320495605, "loss_ct": 0.0, "lr": 0.0, "gnorm": 3.5073776245117188, "bridge_gate_avg": 1.0, "bridge_out_proj_avg": 0.0, "elapsed_s": 3.2642288208007812}
2
+ {"step": 25, "loss": 1.4827123880386353, "loss_mdlm": 0.7698311805725098, "loss_lm": 1.425762414932251, "loss_ct": 0.0, "lr": 4.166666666666667e-05, "gnorm": 2.463526725769043, "bridge_gate_avg": 1.0003358125686646, "bridge_out_proj_avg": 0.00018468878261046484, "elapsed_s": 15.403388500213623}
3
+ {"step": 50, "loss": 2.0127530097961426, "loss_mdlm": 1.4222482442855835, "loss_lm": 1.1810096502304077, "loss_ct": 0.0, "lr": 4.9326121764495596e-05, "gnorm": 3.826711654663086, "bridge_gate_avg": 1.0003427565097809, "bridge_out_proj_avg": 0.0003076296197832562, "elapsed_s": 27.7360782623291}
4
+ {"step": 75, "loss": 1.8004859685897827, "loss_mdlm": 1.2991610765457153, "loss_lm": 1.0026497840881348, "loss_ct": 0.0, "lr": 4.665063509461097e-05, "gnorm": 3.2806148529052734, "bridge_gate_avg": 1.001010239124298, "bridge_out_proj_avg": 0.0005621169984806329, "elapsed_s": 39.93375277519226}
5
+ {"step": 100, "loss": 1.835280179977417, "loss_mdlm": 1.3513433933258057, "loss_lm": 0.9678735733032227, "loss_ct": 0.0, "lr": 4.215604094671835e-05, "gnorm": 3.1473264694213867, "bridge_gate_avg": 1.0016477406024933, "bridge_out_proj_avg": 0.0008466819708701223, "elapsed_s": 51.92164921760559}
6
+ {"step": 125, "loss": 1.8027596473693848, "loss_mdlm": 1.2959831953048706, "loss_lm": 1.0135530233383179, "loss_ct": 0.0, "lr": 3.621997950501156e-05, "gnorm": 3.325122356414795, "bridge_gate_avg": 1.0016797482967377, "bridge_out_proj_avg": 0.0009088016231544316, "elapsed_s": 63.76001238822937}
7
+ {"step": 150, "loss": 1.7762501239776611, "loss_mdlm": 1.2832350730895996, "loss_lm": 0.986030101776123, "loss_ct": 0.0, "lr": 2.9341204441673266e-05, "gnorm": 3.2671163082122803, "bridge_gate_avg": 1.002065271139145, "bridge_out_proj_avg": 0.0010643154091667384, "elapsed_s": 75.7668809890747}
8
+ {"step": 175, "loss": 1.728819727897644, "loss_mdlm": 1.2991365194320679, "loss_lm": 0.8593663573265076, "loss_ct": 0.0, "lr": 2.2097677146869242e-05, "gnorm": 3.0293920040130615, "bridge_gate_avg": 1.0024825930595398, "bridge_out_proj_avg": 0.001225507934577763, "elapsed_s": 87.60593366622925}
9
+ {"step": 200, "loss": 2.012921094894409, "loss_mdlm": 1.318852424621582, "loss_lm": 1.3881372213363647, "loss_ct": 0.0, "lr": 1.509800584902108e-05, "gnorm": 3.447014808654785, "bridge_gate_avg": 1.0027942657470703, "bridge_out_proj_avg": 0.0013518164050765336, "elapsed_s": 99.44173336029053}
10
+ {"step": 225, "loss": 1.9684042930603027, "loss_mdlm": 1.3210722208023071, "loss_lm": 1.2946640253067017, "loss_ct": 0.0, "lr": 8.930309757836517e-06, "gnorm": 4.009990215301514, "bridge_gate_avg": 1.0028858184814453, "bridge_out_proj_avg": 0.0013838975282851607, "elapsed_s": 111.39192724227905}
11
+ {"step": 250, "loss": 1.7437763214111328, "loss_mdlm": 1.3057974576950073, "loss_lm": 0.8759578466415405, "loss_ct": 0.0, "lr": 4.112804714676594e-06, "gnorm": 3.569528341293335, "bridge_gate_avg": 1.002962052822113, "bridge_out_proj_avg": 0.0014074042555876076, "elapsed_s": 123.27344846725464}
12
+ {"step": 275, "loss": 1.6434921026229858, "loss_mdlm": 1.3705134391784668, "loss_lm": 0.5459573864936829, "loss_ct": 0.0, "lr": 1.0502621921127776e-06, "gnorm": 2.482496500015259, "bridge_gate_avg": 1.00298011302948, "bridge_out_proj_avg": 0.001414461905369535, "elapsed_s": 134.3349871635437}