andyjzhao commited on
Commit
ec60bf4
·
verified ·
1 Parent(s): 475bd73

Upload folder using huggingface_hub

Browse files
checkpoint-20/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d76997c5c7ec0559b0a17d06e5b50b2feac552b8961ba2f07364561f6d547ef
3
  size 558664971
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81b058994c7bb01c1974d22357374a9fcaa0183d790223af50af90811785860c
3
  size 558664971
checkpoint-20/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:129016d30aa705b92e6102d79906622950127aaa87e5a4c618c7cbb4f6ee188f
3
  size 279336283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:816ae2edf36355d926b630d48a4a45b67f1986fecc140c4dbd67b92e8acb7e68
3
  size 279336283
checkpoint-20/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52e7a1fb60ae8bfda35fbaf20a1fa4b5ee1f711ba533efbed972766f18d6fbe2
3
- size 16359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b52f36f0d65f68e848f95af11c72cdc4e8a1e2cb2e5a2889df74b6af1f5f8006
3
+ size 14709
checkpoint-20/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "best_global_step": 20,
3
- "best_metric": 15562359.077386793,
4
- "best_model_checkpoint": "/gpfs/scratch/guoh/DNAFM/output/gencode_human_12.8k_12800/CKPT_DEBUG/checkpoint-20",
5
  "epoch": 0.0007091444172605751,
6
  "eval_steps": 10,
7
  "global_step": 20,
@@ -13,57 +13,57 @@
13
  "comp/rl_weight": 0.03,
14
  "comp/strictness": 0.0,
15
  "epoch": 0.00035457220863028757,
16
- "grad_norm": 1504.030029296875,
17
- "loss": 87.8092,
18
- "loss_ce": 59.68216323852539,
19
- "loss_region": 0.0935576930642128,
20
- "loss_total": 59.77572250366211,
21
  "lr": 2.20454076850486e-05,
22
- "router/selected_tokens_s0": 793.03125,
23
- "router/selected_tokens_s1": 148.84375,
24
  "step": 10,
25
  "tokens_trained": 0.00409568
26
  },
27
  {
28
  "epoch": 0.00035457220863028757,
29
- "eval_ppl": 9.153268951196861e+22,
30
- "eval_runtime": 4.9797,
31
  "step": 10,
32
  "tokens_trained": 0.00409568
33
  },
34
  {
35
  "epoch": 0.00035457220863028757,
36
- "eval_F": 0.00177827022776477,
37
- "eval_F_cds": 0.003658417655291659,
38
- "eval_F_dig": 0.0012045211865510327,
39
- "eval_F_exon": 0.0016746678575415876,
40
- "eval_F_intron": 0.001447564894073858,
41
- "eval_F_nig": 0.0013862277187481856,
42
- "eval_F_promoter": 0.0033154658131890054,
43
- "eval_F_utr": 0.0016332169397963454,
44
- "eval_G": 0.011702613646642867,
45
- "eval_G_cds": 0.023833423264492,
46
- "eval_G_dig": 0.009547610734562596,
47
- "eval_G_exon": 0.01037959719586171,
48
- "eval_G_intron": 0.008864032313383523,
49
- "eval_G_nig": 0.008525809138569675,
50
- "eval_G_promoter": 0.02530388628896865,
51
- "eval_G_utr": 0.010295956315471365,
52
- "eval_avg_bp_per_token": 562.3442288953848,
53
- "eval_bp_per_token/cds": 273.34221902017293,
54
- "eval_bp_per_token/dig": 830.2054054054054,
55
- "eval_bp_per_token/exon": 597.1333333333333,
56
- "eval_bp_per_token/intron": 690.8153161864243,
57
- "eval_bp_per_token/nig": 721.3821989528795,
58
- "eval_bp_per_token/promoter": 301.61674296926094,
59
- "eval_bp_per_token/utr": 612.2885304659499,
60
- "eval_ppl_cds": 6.414658338854343e+21,
61
- "eval_ppl_dig": 4.0669318513627916e+21,
62
- "eval_ppl_exon": 2.4904150523692485e+23,
63
- "eval_ppl_intron": 1.535523404049312e+23,
64
- "eval_ppl_nig": 7.19246164907062e+23,
65
- "eval_ppl_promoter": 1.0487349115377585e+21,
66
- "eval_ppl_utr": 3.14597976396868e+23,
67
  "step": 10,
68
  "tokens_trained": 0.00409568
69
  },
@@ -71,11 +71,11 @@
71
  "comp/rl_weight": 0.03,
72
  "comp/strictness": 0.0,
73
  "epoch": 0.0007091444172605751,
74
- "grad_norm": 566.407958984375,
75
- "loss": 41.7086,
76
- "loss_ce": 21.22186279296875,
77
- "loss_region": 0.10101450234651566,
78
- "loss_total": 21.322877883911133,
79
  "lr": 4.654030511288038e-05,
80
  "router/selected_tokens_s0": 1.0,
81
  "router/selected_tokens_s1": 1.0,
@@ -84,8 +84,8 @@
84
  },
85
  {
86
  "epoch": 0.0007091444172605751,
87
- "eval_ppl": 15562359.077386793,
88
- "eval_runtime": 4.5207,
89
  "step": 20,
90
  "tokens_trained": 0.00819136
91
  },
@@ -99,9 +99,9 @@
99
  "eval_F_nig": 8.365496566708533e-05,
100
  "eval_F_promoter": 4.770454407466195e-05,
101
  "eval_F_utr": 7.9026626119178e-05,
102
- "eval_G": 7.816417754056831e-05,
103
  "eval_G_cds": 4.744345662481978e-05,
104
- "eval_G_dig": 8.086518396619527e-05,
105
  "eval_G_exon": 6.977782739756614e-05,
106
  "eval_G_intron": 8.580132276805985e-05,
107
  "eval_G_nig": 8.365496566708533e-05,
@@ -115,13 +115,13 @@
115
  "eval_bp_per_token/nig": 11953.86301369863,
116
  "eval_bp_per_token/promoter": 20962.363636363636,
117
  "eval_bp_per_token/utr": 12653.962962962964,
118
- "eval_ppl_cds": 5593566.178288604,
119
- "eval_ppl_dig": 35486712.16234024,
120
- "eval_ppl_exon": 17259683.491786722,
121
- "eval_ppl_intron": 17053510.68256213,
122
- "eval_ppl_nig": 19611828.658571318,
123
- "eval_ppl_promoter": 9113844.845808096,
124
- "eval_ppl_utr": 14151555.844300926,
125
  "step": 20,
126
  "tokens_trained": 0.00819136
127
  }
 
1
  {
2
  "best_global_step": 20,
3
+ "best_metric": 148816.18235103838,
4
+ "best_model_checkpoint": "/network/scratch/j/jianan.zhao/DNAFM/output/gencode_human_12.8k_12800/CKPT_DEBUG/checkpoint-20",
5
  "epoch": 0.0007091444172605751,
6
  "eval_steps": 10,
7
  "global_step": 20,
 
13
  "comp/rl_weight": 0.03,
14
  "comp/strictness": 0.0,
15
  "epoch": 0.00035457220863028757,
16
+ "grad_norm": 1111.61279296875,
17
+ "loss": 146.1968,
18
+ "loss_ce": 54.305824279785156,
19
+ "loss_region": 0.10640381276607513,
20
+ "loss_total": 54.412227630615234,
21
  "lr": 2.20454076850486e-05,
22
+ "router/selected_tokens_s0": 21.6875,
23
+ "router/selected_tokens_s1": 1.0,
24
  "step": 10,
25
  "tokens_trained": 0.00409568
26
  },
27
  {
28
  "epoch": 0.00035457220863028757,
29
+ "eval_ppl": 7.424721446549467e+17,
30
+ "eval_runtime": 7.6118,
31
  "step": 10,
32
  "tokens_trained": 0.00409568
33
  },
34
  {
35
  "epoch": 0.00035457220863028757,
36
+ "eval_F": 7.813110399249941e-05,
37
+ "eval_F_cds": 4.744345662481978e-05,
38
+ "eval_F_dig": 7.813110399249941e-05,
39
+ "eval_F_exon": 6.977782739756614e-05,
40
+ "eval_F_intron": 8.580132276805985e-05,
41
+ "eval_F_nig": 8.365496566708533e-05,
42
+ "eval_F_promoter": 4.770454407466195e-05,
43
+ "eval_F_utr": 7.9026626119178e-05,
44
+ "eval_G": 0.00015868149956862495,
45
+ "eval_G_cds": 0.00015302779857089767,
46
+ "eval_G_dig": 0.00013616989934109436,
47
+ "eval_G_exon": 0.0001662856506549812,
48
+ "eval_G_intron": 0.00016059590085930095,
49
+ "eval_G_nig": 0.00015651285421575188,
50
+ "eval_G_promoter": 0.00015211858489077828,
51
+ "eval_G_utr": 0.00018231460938894855,
52
+ "eval_avg_bp_per_token": 12799.0,
53
+ "eval_bp_per_token/cds": 21077.722222222223,
54
+ "eval_bp_per_token/dig": 12799.0,
55
+ "eval_bp_per_token/exon": 14331.2,
56
+ "eval_bp_per_token/intron": 11654.831973898858,
57
+ "eval_bp_per_token/nig": 11953.86301369863,
58
+ "eval_bp_per_token/promoter": 20962.363636363636,
59
+ "eval_bp_per_token/utr": 12653.962962962964,
60
+ "eval_ppl_cds": 2.4835679876749204e+20,
61
+ "eval_ppl_dig": 9.028849885879438e+16,
62
+ "eval_ppl_exon": 2.2687957801872694e+18,
63
+ "eval_ppl_intron": 2.8188580486001277e+17,
64
+ "eval_ppl_nig": 1.1219396355209006e+17,
65
+ "eval_ppl_promoter": 1.6162428794991283e+20,
66
+ "eval_ppl_utr": 4.3084586855038605e+17,
67
  "step": 10,
68
  "tokens_trained": 0.00409568
69
  },
 
71
  "comp/rl_weight": 0.03,
72
  "comp/strictness": 0.0,
73
  "epoch": 0.0007091444172605751,
74
+ "grad_norm": 330.2630310058594,
75
+ "loss": 25.8642,
76
+ "loss_ce": 12.18574047088623,
77
+ "loss_region": 0.09936444461345673,
78
+ "loss_total": 12.285104751586914,
79
  "lr": 4.654030511288038e-05,
80
  "router/selected_tokens_s0": 1.0,
81
  "router/selected_tokens_s1": 1.0,
 
84
  },
85
  {
86
  "epoch": 0.0007091444172605751,
87
+ "eval_ppl": 148816.18235103838,
88
+ "eval_runtime": 7.2278,
89
  "step": 20,
90
  "tokens_trained": 0.00819136
91
  },
 
99
  "eval_F_nig": 8.365496566708533e-05,
100
  "eval_F_promoter": 4.770454407466195e-05,
101
  "eval_F_utr": 7.9026626119178e-05,
102
+ "eval_G": 7.813110399249941e-05,
103
  "eval_G_cds": 4.744345662481978e-05,
104
+ "eval_G_dig": 7.813110399249941e-05,
105
  "eval_G_exon": 6.977782739756614e-05,
106
  "eval_G_intron": 8.580132276805985e-05,
107
  "eval_G_nig": 8.365496566708533e-05,
 
115
  "eval_bp_per_token/nig": 11953.86301369863,
116
  "eval_bp_per_token/promoter": 20962.363636363636,
117
  "eval_bp_per_token/utr": 12653.962962962964,
118
+ "eval_ppl_cds": 395673.42673693807,
119
+ "eval_ppl_dig": 31301.43244868628,
120
+ "eval_ppl_exon": 140758.6210649053,
121
+ "eval_ppl_intron": 122319.47964181146,
122
+ "eval_ppl_nig": 111897.23080114595,
123
+ "eval_ppl_promoter": 421597.51324185927,
124
+ "eval_ppl_utr": 202983.65571501417,
125
  "step": 20,
126
  "tokens_trained": 0.00819136
127
  }
checkpoint-20/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:faf9107e8232f8c02d0de570892b7fdd717781cc6eb0d429077eedff87e08462
3
  size 5969
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09a783c7f9bdabaac56f2ebff5b9206706ee40f8914b7eb767a104570a9abfac
3
  size 5969