explcre commited on
Commit
c66ff97
·
verified ·
1 Parent(s): f658d35

Upload exp_phase8_reasoning_grounded_rl_t3_r128_alpha1_s2_par_20260506_221253/log.jsonl with huggingface_hub

Browse files
exp_phase8_reasoning_grounded_rl_t3_r128_alpha1_s2_par_20260506_221253/log.jsonl CHANGED
@@ -1 +1,11 @@
1
  {"step": 1, "loss": 99.54866027832031, "mean_r": -0.8137362599372864, "max_r": -0.6333333253860474, "mean_grounded": 0.25, "mean_halluc": 9.5, "mean_cited": 10.25, "mean_tf_grounded_rate": 0.019230769230769232, "gnorm": 417.38580322265625, "elapsed_s": 49.00086331367493, "cell": "Oli", "id": "train:edit:Oli:ARL6IP4:chr12_122839369_122839869:3262"}
 
 
 
 
 
 
 
 
 
 
 
1
  {"step": 1, "loss": 99.54866027832031, "mean_r": -0.8137362599372864, "max_r": -0.6333333253860474, "mean_grounded": 0.25, "mean_halluc": 9.5, "mean_cited": 10.25, "mean_tf_grounded_rate": 0.019230769230769232, "gnorm": 417.38580322265625, "elapsed_s": 49.00086331367493, "cell": "Oli", "id": "train:edit:Oli:ARL6IP4:chr12_122839369_122839869:3262"}
2
+ {"step": 5, "loss": 45.6891975402832, "mean_r": -0.8527777791023254, "max_r": -0.6666666865348816, "mean_grounded": 0.0, "mean_halluc": 8.75, "mean_cited": 9.25, "mean_tf_grounded_rate": 0.0, "gnorm": 334.50396728515625, "elapsed_s": 184.91056060791016, "cell": "Ex", "id": "train:edit:Ex:DNAAF1:chr16_84178560_84179060:1583"}
3
+ {"step": 10, "loss": -151.15805053710938, "mean_r": -0.6806226968765259, "max_r": -0.47999998927116394, "mean_grounded": 1.0, "mean_halluc": 11.0, "mean_cited": 12.0, "mean_tf_grounded_rate": 0.08846153846153847, "gnorm": 564.0594482421875, "elapsed_s": 359.7687704563141, "cell": "Ex", "id": "train:edit:Ex:MLLT6:chr17_38868079_38868579:1284"}
4
+ {"step": 15, "loss": -66.16642761230469, "mean_r": -0.3159523904323578, "max_r": 0.3333333432674408, "mean_grounded": 1.5, "mean_halluc": 6.25, "mean_cited": 8.25, "mean_tf_grounded_rate": 0.2669642857142857, "gnorm": 283.5673522949219, "elapsed_s": 530.5415060520172, "cell": "Ast", "id": "train:edit:Ast:DNAJC24:chr11_31243512_31244012:3637"}
5
+ {"step": 20, "loss": 65.90116882324219, "mean_r": -0.596795916557312, "max_r": -0.30000001192092896, "mean_grounded": 2.0, "mean_halluc": 25.5, "mean_cited": 27.75, "mean_tf_grounded_rate": 0.1682213751438435, "gnorm": 531.0924682617188, "elapsed_s": 700.5572099685669, "cell": "Ast", "id": "train:edit:Ast:IFITM10:chr11_1855490_1855990:1025"}
6
+ {"step": 25, "loss": -130.81112670898438, "mean_r": -0.14208334684371948, "max_r": 1.0, "mean_grounded": 2.75, "mean_halluc": 6.5, "mean_cited": 9.25, "mean_tf_grounded_rate": 0.40208333333333335, "gnorm": 300.39093017578125, "elapsed_s": 873.0645732879639, "cell": "Ast", "id": "train:edit:Ast:SPARCL1:chr4_87483231_87483731:281"}
7
+ {"step": 30, "loss": -46.04944610595703, "mean_r": -0.47860753536224365, "max_r": 0.0, "mean_grounded": 1.5, "mean_halluc": 10.25, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.09505772005772006, "gnorm": 236.1367645263672, "elapsed_s": 1055.0520577430725, "cell": "Mic", "id": "train:edit:Mic:BRD7:chr16_50312442_50312942:2718"}
8
+ {"step": 35, "loss": -91.60397338867188, "mean_r": -0.7679486870765686, "max_r": -0.5, "mean_grounded": 0.5, "mean_halluc": 10.25, "mean_cited": 11.0, "mean_tf_grounded_rate": 0.03571428571428571, "gnorm": 478.71514892578125, "elapsed_s": 1211.2856006622314, "cell": "Ast", "id": "train:edit:Ast:LINC01136:chr1_203146515_203147015:2070"}
9
+ {"step": 40, "loss": 28.521331787109375, "mean_r": -0.5103527903556824, "max_r": -0.17894737422466278, "mean_grounded": 2.75, "mean_halluc": 12.0, "mean_cited": 16.0, "mean_tf_grounded_rate": 0.14325896262395119, "gnorm": 528.1494140625, "elapsed_s": 1381.4892029762268, "cell": "Mic", "id": "train:edit:Mic:MYO1C:chr17_1589953_1590453:367"}
10
+ {"step": 45, "loss": 92.89891815185547, "mean_r": -0.6608928442001343, "max_r": -0.375, "mean_grounded": 1.75, "mean_halluc": 9.0, "mean_cited": 10.75, "mean_tf_grounded_rate": 0.14107142857142857, "gnorm": 368.6761474609375, "elapsed_s": 1560.6473388671875, "cell": "Oli", "id": "train:edit:Oli:RRP9:chr3_52014575_52015075:2797"}
11
+ {"step": 50, "loss": -126.95048522949219, "mean_r": -0.3968142867088318, "max_r": 0.027272727340459824, "mean_grounded": 1.5, "mean_halluc": 8.25, "mean_cited": 11.0, "mean_tf_grounded_rate": 0.2297979797979798, "gnorm": 494.4970397949219, "elapsed_s": 1729.027425289154, "cell": "Mic", "id": "train:edit:Mic:LINC00461:chr5_88824152_88824652:1592"}