Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/pyt_save/model.pt +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/vars.pkl +3 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=5_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=5_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt +11 -0
- reward_1707780024.4380288_rfbase_cotTrue_task_index=5_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=5_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt +3 -0
reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 935.0 0.0 935.0 935.0 958.81506 0.0 958.81506 958.81506 0.058018792 0.02861838 0.11931482 0.024831772 -0.031212114 1.4881060123443604
|
| 3 |
+
1 1146.0 0.0 1146.0 1146.0 1089.2394 0.0 1089.2394 1089.2394 3.9360142 0.18713778 4.1525836 3.6220293 0.03685774 2.9063098430633545
|
| 4 |
+
2 1114.0 0.0 1114.0 1114.0 1129.116 0.0 1129.116 1129.116 4.634061 1.1898764 6.277654 3.1035814 -0.010468043 4.320961236953735
|
| 5 |
+
3 1137.0 0.0 1137.0 1137.0 1171.5638 0.0 1171.5638 1171.5638 5.046778 1.535573 7.290665 2.9499335 -0.029821746 5.73552680015564
|
| 6 |
+
4 1117.0 0.0 1117.0 1117.0 1152.1124 0.0 1152.1124 1152.1124 5.3372173 1.4758617 7.717772 3.1613023 -0.042354897 7.1466710567474365
|
| 7 |
+
5 1151.0 0.0 1151.0 1151.0 1193.8174 0.0 1193.8174 1193.8174 5.3494215 1.3711958 7.7694917 3.3517578 -0.048877865 8.583211183547974
|
| 8 |
+
6 1126.0 0.0 1126.0 1126.0 1193.8207 0.0 1193.8207 1193.8207 5.5585713 1.636862 8.501507 3.173237 -0.07759775 9.99778699874878
|
| 9 |
+
7 1131.0 0.0 1131.0 1131.0 1160.9905 0.0 1160.9905 1160.9905 5.5605564 1.6539116 8.630872 3.356909 -0.0351999 11.410574913024902
|
| 10 |
+
8 1133.0 0.0 1133.0 1133.0 1136.8328 0.0 1136.8328 1136.8328 5.423081 1.663091 8.643065 2.9460669 -0.004513502 12.855329751968384
|
| 11 |
+
9 1163.0 0.0 1163.0 1163.0 1163.4518 0.0 1163.4518 1163.4518 5.352908 1.4534807 8.235616 3.1853917 -0.0005123764 14.319170713424683
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4325203f7d75ec91fb7df19a6593e34ef3454953d7bfa31f4992975d799e0662
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 1012.0 0.0 1012.0 1012.0 1050.8109 0.0 1050.8109 1050.8109 0.21133251 0.04107647 0.2794286 0.15483904 -0.031223506 1.6694228649139404
|
| 3 |
+
1 1130.0 0.0 1130.0 1130.0 1157.7743 0.0 1157.7743 1157.7743 4.3821545 0.3579786 4.816786 3.5450249 -0.014633879 3.348346710205078
|
| 4 |
+
2 1114.0 0.0 1114.0 1114.0 1204.0416 0.0 1204.0416 1204.0416 5.1830187 1.3640116 6.9855337 2.831925 -0.047540292 5.014883995056152
|
| 5 |
+
3 1129.0 0.0 1129.0 1129.0 1185.5929 0.0 1185.5929 1185.5929 5.467668 1.5511539 7.6260467 2.7476642 -0.029786244 6.683060169219971
|
| 6 |
+
4 1123.0 0.0 1123.0 1123.0 1178.2816 0.0 1178.2816 1178.2816 5.4397106 1.5729288 7.691392 2.9557455 -0.029095694 8.350719928741455
|
| 7 |
+
5 1134.0 0.0 1134.0 1134.0 1193.5576 0.0 1193.5576 1193.5576 5.3784876 1.7434099 7.976144 2.0719204 -0.03137976 10.01439356803894
|
| 8 |
+
6 1162.0 0.0 1162.0 1162.0 1231.5813 0.0 1231.5813 1231.5813 5.460224 1.8280329 8.46003 2.0440905 -0.036641836 11.68005084991455
|
| 9 |
+
7 1130.0 0.0 1130.0 1130.0 1275.5763 0.0 1275.5763 1275.5763 5.61514 1.7658131 8.56203 2.333252 -0.07661867 13.358151912689209
|
| 10 |
+
8 1152.0 0.0 1152.0 1152.0 1246.6604 0.0 1246.6604 1246.6604 5.9103584 1.5978097 8.620821 2.842272 -0.04984729 15.018638610839844
|
| 11 |
+
9 1160.0 0.0 1160.0 1160.0 1177.7042 0.0 1177.7042 1177.7042 5.785543 1.8555775 8.866861 2.2370443 -0.009317651 16.680999755859375
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc33fca07daa81c960cc0f5980a80d597b19271dd94407c2f94bf6a64f16cd3e
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=0_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:770168b3aaef05c84af851d3036d265dcee4f037db63d5c1823616342f1a4a47
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 953.0 0.0 953.0 953.0 1001.78564 0.0 1001.78564 1001.78564 0.064820394 0.030788934 0.12834144 0.025601551 -0.05361031 1.6537342071533203
|
| 3 |
+
1 1244.0 0.0 1244.0 1244.0 1219.6957 0.0 1219.6957 1219.6957 4.2167783 0.15534228 4.3689446 3.793606 0.012791872 3.280769109725952
|
| 4 |
+
2 1192.0 0.0 1192.0 1192.0 1250.1178 0.0 1250.1178 1250.1178 5.468623 1.3007789 6.996779 2.943526 -0.030620947 4.810173749923706
|
| 5 |
+
3 1205.0 0.0 1205.0 1205.0 1297.8342 0.0 1297.8342 1297.8342 5.799386 1.554889 7.896148 2.9416165 -0.048911247 6.327655553817749
|
| 6 |
+
4 1188.0 0.0 1188.0 1188.0 1315.5549 0.0 1315.5549 1315.5549 6.100899 1.7212788 8.686271 2.9031608 -0.06720509 7.8476622104644775
|
| 7 |
+
5 1243.0 0.0 1243.0 1243.0 1375.3137 0.0 1375.3137 1375.3137 6.257169 1.4943792 8.640024 3.4757495 -0.07026765 9.384979724884033
|
| 8 |
+
6 1240.0 0.0 1240.0 1240.0 1428.3319 0.0 1428.3319 1428.3319 6.543582 1.5338403 9.119177 3.7653043 -0.09917416 10.901644229888916
|
| 9 |
+
7 1228.0 0.0 1228.0 1228.0 1331.635 0.0 1331.635 1331.635 6.732708 1.736254 9.701538 3.9228978 -0.054717377 12.548632621765137
|
| 10 |
+
8 1204.0 0.0 1204.0 1204.0 1249.7778 0.0 1249.7778 1249.7778 6.362156 1.7360414 9.56274 3.5230036 -0.024297696 14.192672729492188
|
| 11 |
+
9 1239.0 0.0 1239.0 1239.0 1283.9503 0.0 1283.9503 1283.9503 5.9131517 1.8111537 9.319001 2.9190016 -0.023757637 15.83892273902893
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f926d5716d141a78ed669dbe7e5903f2e58bfbc84d7b6ce849cc70d870c3e52
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=10_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 908.0 0.0 908.0 908.0 968.69635 0.0 968.69635 968.69635 0.06582711 0.030821329 0.12859085 0.02594243 -0.06355667 1.7348337173461914
|
| 3 |
+
1 1206.0 0.0 1206.0 1206.0 1200.5833 0.0 1200.5833 1200.5833 3.96463 0.15318736 4.162917 3.481343 0.002712503 3.452739953994751
|
| 4 |
+
2 1176.0 0.0 1176.0 1176.0 1259.1947 0.0 1259.1947 1259.1947 5.2608776 1.4056866 7.1080832 2.923253 -0.04159731 5.1742284297943115
|
| 5 |
+
3 1176.0 0.0 1176.0 1176.0 1299.9003 0.0 1299.9003 1299.9003 5.5887127 1.6334538 8.155524 2.5881684 -0.061980933 6.89327335357666
|
| 6 |
+
4 1163.0 0.0 1163.0 1163.0 1316.5605 0.0 1316.5605 1316.5605 5.8823 1.817601 9.089848 3.1801522 -0.07681815 8.603352308273315
|
| 7 |
+
5 1213.0 0.0 1213.0 1213.0 1380.5156 0.0 1380.5156 1380.5156 6.0324545 1.678483 8.968804 3.3052797 -0.08392638 10.315141439437866
|
| 8 |
+
6 1194.0 0.0 1194.0 1194.0 1419.2574 0.0 1419.2574 1419.2574 6.266953 1.7976339 9.527894 3.4599137 -0.11262952 12.03567886352539
|
| 9 |
+
7 1204.0 0.0 1204.0 1204.0 1334.4447 0.0 1334.4447 1334.4447 6.5455937 1.9995801 10.066083 3.226369 -0.06522277 13.635676383972168
|
| 10 |
+
8 1174.0 0.0 1174.0 1174.0 1244.5249 0.0 1244.5249 1244.5249 6.0375304 1.9673376 9.803665 2.3823411 -0.035262793 15.218774318695068
|
| 11 |
+
9 1196.0 0.0 1196.0 1196.0 1267.0073 0.0 1267.0073 1267.0073 5.618536 2.104748 9.607915 1.7530874 -0.035503265 16.795999765396118
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:750e137edde21cfcedc166289ceb2706d6cc39b590fed3c959c24052311923c2
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=11_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 906.0 0.0 906.0 906.0 958.6794 0.0 958.6794 958.6794 0.06537555 0.03077103 0.1283747 0.025646895 -0.054931372 1.5906627178192139
|
| 3 |
+
1 1189.0 0.0 1189.0 1189.0 1162.9946 0.0 1162.9946 1162.9946 4.119972 0.13190477 4.279611 3.6784532 0.013054594 3.1784133911132812
|
| 4 |
+
2 1157.0 0.0 1157.0 1157.0 1224.7367 0.0 1224.7367 1224.7367 5.346582 1.2975943 6.915835 2.980411 -0.03386805 4.768067836761475
|
| 5 |
+
3 1155.0 0.0 1155.0 1155.0 1256.6157 0.0 1256.6157 1256.6157 5.710756 1.4902661 7.785035 3.0153704 -0.050858963 6.358244895935059
|
| 6 |
+
4 1132.0 0.0 1132.0 1132.0 1264.9797 0.0 1264.9797 1264.9797 5.9944754 1.6540933 8.606736 3.036939 -0.066723146 7.968702554702759
|
| 7 |
+
5 1173.0 0.0 1173.0 1173.0 1315.4581 0.0 1315.4581 1315.4581 6.1000853 1.4928354 8.567352 3.489823 -0.07180351 9.55355453491211
|
| 8 |
+
6 1166.0 0.0 1166.0 1166.0 1366.8982 0.0 1366.8982 1366.8982 6.3032246 1.5479369 8.995157 3.72458 -0.100600325 11.143269062042236
|
| 9 |
+
7 1182.0 0.0 1182.0 1182.0 1293.4285 0.0 1293.4285 1293.4285 6.5447054 1.7345475 9.620521 3.9211545 -0.055797532 12.874008893966675
|
| 10 |
+
8 1153.0 0.0 1153.0 1153.0 1204.4282 0.0 1204.4282 1204.4282 6.187322 1.7507019 9.490139 3.5125163 -0.025727488 14.590080976486206
|
| 11 |
+
9 1183.0 0.0 1183.0 1183.0 1229.5833 0.0 1229.5833 1229.5833 5.7720304 1.8804164 9.252505 2.8288438 -0.023292314 16.313095092773438
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d9e2d0e2f93f26d1c4b2d401afc34829ef3078446ea1ead44cb81c1880c2ca29
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 912.0 0.0 912.0 912.0 973.66516 0.0 973.66516 973.66516 0.06393835 0.029945994 0.12872031 0.026120022 -0.06874615 1.6659510135650635
|
| 3 |
+
1 1192.0 0.0 1192.0 1192.0 1204.0017 0.0 1204.0017 1204.0017 4.139745 0.14927915 4.2879324 3.7306898 -0.00634329 3.3327438831329346
|
| 4 |
+
2 1165.0 0.0 1165.0 1165.0 1253.0822 0.0 1253.0822 1253.0822 5.338219 1.0354236 6.573024 3.4108663 -0.04635916 4.9872963428497314
|
| 5 |
+
3 1173.0 0.0 1173.0 1173.0 1311.4451 0.0 1311.4451 1311.4451 5.758373 1.4173946 7.6176085 3.1961422 -0.07294299 6.644782304763794
|
| 6 |
+
4 1149.0 0.0 1149.0 1149.0 1311.2649 0.0 1311.2649 1311.2649 6.1273785 1.4911681 8.362892 3.328421 -0.08571756 8.199853420257568
|
| 7 |
+
5 1192.0 0.0 1192.0 1192.0 1372.2527 0.0 1372.2527 1372.2527 6.2470493 1.3111086 8.337785 3.724815 -0.09501964 9.860314846038818
|
| 8 |
+
6 1189.0 0.0 1189.0 1189.0 1425.3804 0.0 1425.3804 1425.3804 6.468536 1.4719385 8.906117 3.7153807 -0.12441066 11.520072937011719
|
| 9 |
+
7 1192.0 0.0 1192.0 1192.0 1334.3293 0.0 1334.3293 1334.3293 6.7596803 1.6096861 9.523318 4.0959826 -0.074909404 13.168299198150635
|
| 10 |
+
8 1169.0 0.0 1169.0 1169.0 1250.5563 0.0 1250.5563 1250.5563 6.362063 1.5924534 9.402348 3.694228 -0.042925037 14.82404899597168
|
| 11 |
+
9 1179.0 0.0 1179.0 1179.0 1268.1361 0.0 1268.1361 1268.1361 5.868972 1.6910975 9.0989685 2.9728293 -0.046914358 16.52371883392334
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8610425fd037b583a8c697e204a614bf27ca71d58388803de05163f51d75ddd
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 953.0 0.0 953.0 953.0 983.2959 0.0 983.2959 983.2959 0.06088065 0.029098347 0.11947158 0.027638376 -0.037127502 1.4292283058166504
|
| 3 |
+
1 1193.0 0.0 1193.0 1193.0 1152.4028 0.0 1152.4028 1152.4028 4.0307956 0.1967857 4.231489 3.6537817 0.027504958 2.8551692962646484
|
| 4 |
+
2 1193.0 0.0 1193.0 1193.0 1207.2128 0.0 1207.2128 1207.2128 4.9806504 1.2189851 6.4102397 3.1584384 -0.012678631 4.28946328163147
|
| 5 |
+
3 1223.0 0.0 1223.0 1223.0 1275.0652 0.0 1275.0652 1275.0652 5.484776 1.4145527 7.2994614 3.3080153 -0.039774604 5.7326319217681885
|
| 6 |
+
4 1151.0 0.0 1151.0 1151.0 1218.8317 0.0 1218.8317 1218.8317 5.8252735 1.603229 8.059538 3.15971 -0.05374962 7.161067485809326
|
| 7 |
+
5 1192.0 0.0 1192.0 1192.0 1267.9004 0.0 1267.9004 1267.9004 5.750593 1.4211072 8.039577 3.4274483 -0.0637282 8.59539008140564
|
| 8 |
+
6 1192.0 0.0 1192.0 1192.0 1317.8253 0.0 1317.8253 1317.8253 5.8999863 1.667073 8.666302 3.2965572 -0.09348099 10.133167505264282
|
| 9 |
+
7 1204.0 0.0 1204.0 1204.0 1265.6321 0.0 1265.6321 1265.6321 6.1705256 1.8438786 9.165756 3.4471583 -0.04247594 11.674520492553711
|
| 10 |
+
8 1178.0 0.0 1178.0 1178.0 1193.7365 0.0 1193.7365 1193.7365 5.86707 1.7104177 8.922114 3.2833862 -0.010890298 13.209067583084106
|
| 11 |
+
9 1219.0 0.0 1219.0 1219.0 1239.4601 0.0 1239.4601 1239.4601 5.57733 1.586236 8.602832 3.1637225 -0.013994768 14.741300821304321
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1faa7611bcc1bb9a37a4642e5d0d4789a990cc739d68c11848c2a1c3f4f0565
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 920.0 0.0 920.0 920.0 972.98444 0.0 972.98444 972.98444 0.065948814 0.030870939 0.12837547 0.025647953 -0.05496287 1.738675594329834
|
| 3 |
+
1 1192.0 0.0 1192.0 1192.0 1171.1571 0.0 1171.1571 1171.1571 4.2092886 0.13942103 4.375939 3.7525601 0.010437354 3.4684016704559326
|
| 4 |
+
2 1184.0 0.0 1184.0 1184.0 1249.9778 0.0 1249.9778 1249.9778 5.4445496 1.3619596 7.0394816 2.9952383 -0.03298798 5.193624019622803
|
| 5 |
+
3 1183.0 0.0 1183.0 1183.0 1285.2948 0.0 1285.2948 1285.2948 5.848812 1.5783962 7.952702 3.0170097 -0.05119887 6.919215202331543
|
| 6 |
+
4 1153.0 0.0 1153.0 1153.0 1290.8324 0.0 1290.8324 1290.8324 6.118179 1.7235568 8.697647 3.062007 -0.06929724 8.513078451156616
|
| 7 |
+
5 1200.0 0.0 1200.0 1200.0 1346.4 0.0 1346.4 1346.4 6.2196054 1.5467654 8.623663 3.501527 -0.07382712 10.090184688568115
|
| 8 |
+
6 1186.0 0.0 1186.0 1186.0 1391.2561 0.0 1391.2561 1391.2561 6.437819 1.6424723 9.101392 3.6879182 -0.10267923 11.666984796524048
|
| 9 |
+
7 1219.0 0.0 1219.0 1219.0 1328.8165 0.0 1328.8165 1328.8165 6.672976 1.8210331 9.679336 3.9335535 -0.055046003 13.248085021972656
|
| 10 |
+
8 1188.0 0.0 1188.0 1188.0 1239.899 0.0 1239.899 1239.899 6.3292365 1.813252 9.473634 3.4842882 -0.02596265 14.83223295211792
|
| 11 |
+
9 1208.0 0.0 1208.0 1208.0 1260.478 0.0 1260.478 1260.478 5.9101896 1.9121094 9.200022 2.8472924 -0.026239026 16.412571668624878
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2708bfc2038bfab5a48a789cf8ae5d799d59293f030e278d1751fa29aaa0b87
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 923.0 0.0 923.0 923.0 983.7524 0.0 983.7524 983.7524 0.061607245 0.029617704 0.12877157 0.026190445 -0.070806205 1.5106761455535889
|
| 3 |
+
1 1166.0 0.0 1166.0 1166.0 1181.085 0.0 1181.085 1181.085 4.0912137 0.16223936 4.26049 3.730615 -0.008407839 3.0113251209259033
|
| 4 |
+
2 1173.0 0.0 1173.0 1173.0 1262.7911 0.0 1262.7911 1262.7911 5.1378536 1.1916949 6.6134205 3.2768438 -0.049884103 4.5416259765625
|
| 5 |
+
3 1167.0 0.0 1167.0 1167.0 1307.823 0.0 1307.823 1307.823 5.674875 1.5102973 7.664962 3.2637599 -0.07827811 6.047931671142578
|
| 6 |
+
4 1120.0 0.0 1120.0 1120.0 1276.14 0.0 1276.14 1276.14 6.021316 1.6237295 8.462135 3.3806243 -0.08674408 7.546782732009888
|
| 7 |
+
5 1192.0 0.0 1192.0 1192.0 1371.3181 0.0 1371.3181 1371.3181 6.0253954 1.4721338 8.3983345 3.6176198 -0.099675745 9.132035493850708
|
| 8 |
+
6 1163.0 0.0 1163.0 1163.0 1394.38 0.0 1394.38 1394.38 6.4074035 1.5698775 9.042046 3.8589818 -0.12854391 10.744093418121338
|
| 9 |
+
7 1175.0 0.0 1175.0 1175.0 1316.3539 0.0 1316.3539 1316.3539 6.6073084 1.7188287 9.598959 4.124531 -0.078530006 12.35179853439331
|
| 10 |
+
8 1154.0 0.0 1154.0 1154.0 1237.8258 0.0 1237.8258 1237.8258 6.241708 1.8021115 9.602525 3.5921843 -0.04657021 13.966685771942139
|
| 11 |
+
9 1177.0 0.0 1177.0 1177.0 1266.8389 0.0 1266.8389 1266.8389 5.706153 1.8605907 9.218033 2.9221117 -0.04990985 15.57736611366272
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04bdae8b27e75a824d9c2f629ba7b44e778cb33328363746e32cf0b2b0acb976
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 987.0 0.0 987.0 987.0 1012.9715 0.0 1012.9715 1012.9715 0.21154436 0.041003454 0.27913898 0.15464641 -0.02079381 1.6853346824645996
|
| 3 |
+
1 1136.0 0.0 1136.0 1136.0 1141.974 0.0 1141.974 1141.974 4.2904053 0.35412526 4.750295 3.4774776 -0.0031471103 3.352159023284912
|
| 4 |
+
2 1092.0 0.0 1092.0 1092.0 1157.4108 0.0 1157.4108 1157.4108 5.0475383 1.343021 6.924373 2.7745128 -0.034463406 5.018894195556641
|
| 5 |
+
3 1102.0 0.0 1102.0 1102.0 1138.6979 0.0 1138.6979 1138.6979 5.2399426 1.4962304 7.4054785 2.501412 -0.019529685 6.578514575958252
|
| 6 |
+
4 1089.0 0.0 1089.0 1089.0 1125.1641 0.0 1125.1641 1125.1641 5.174271 1.5561018 7.5064106 2.2210414 -0.019033745 8.117218971252441
|
| 7 |
+
5 1121.0 0.0 1121.0 1121.0 1162.4714 0.0 1162.4714 1162.4714 5.076506 1.6752964 7.6898804 2.4245434 -0.021839365 9.656955003738403
|
| 8 |
+
6 1150.0 0.0 1150.0 1150.0 1201.6523 0.0 1201.6523 1201.6523 5.1883826 1.7504545 8.211736 2.6632872 -0.027199477 11.20093560218811
|
| 9 |
+
7 1099.0 0.0 1099.0 1099.0 1228.1823 0.0 1228.1823 1228.1823 5.419756 1.7741109 8.628821 2.0804408 -0.06799051 12.742582082748413
|
| 10 |
+
8 1120.0 0.0 1120.0 1120.0 1194.6515 0.0 1194.6515 1194.6515 5.6818314 1.529158 8.465559 2.6507297 -0.039353177 14.2914719581604
|
| 11 |
+
9 1136.0 0.0 1136.0 1136.0 1133.9075 0.0 1133.9075 1133.9075 5.4949574 1.8131995 8.767371 1.9788646 0.0011012182 15.832674503326416
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed2c4d1f1345128855db81c46bb2d3066984d62eb630771d20a1aef0880b5ec1
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=1_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:770168b3aaef05c84af851d3036d265dcee4f037db63d5c1823616342f1a4a47
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 951.0 0.0 951.0 951.0 976.8953 0.0 976.8953 976.8953 0.06241772 0.03056342 0.1277354 0.02478075 -0.029730119 1.6409080028533936
|
| 3 |
+
1 1214.0 0.0 1214.0 1214.0 1150.9373 0.0 1150.9373 1150.9373 4.087099 0.19205798 4.2850094 3.6689117 0.035329178 3.2533345222473145
|
| 4 |
+
2 1205.0 0.0 1205.0 1205.0 1216.1172 0.0 1216.1172 1216.1172 5.089922 1.4271455 6.8031816 2.8130212 -0.0062813237 4.876632213592529
|
| 5 |
+
3 1199.0 0.0 1199.0 1199.0 1246.0989 0.0 1246.0989 1246.0989 5.5095453 1.6543297 7.7526712 2.886612 -0.027367193 6.432351589202881
|
| 6 |
+
4 1187.0 0.0 1187.0 1187.0 1264.0752 0.0 1264.0752 1264.0752 5.770391 1.8019516 8.518605 2.8202922 -0.04576904 7.927778005599976
|
| 7 |
+
5 1194.0 0.0 1194.0 1194.0 1277.6978 0.0 1277.6978 1277.6978 5.96397 1.556893 8.4700165 3.4647555 -0.05066451 9.41650390625
|
| 8 |
+
6 1202.0 0.0 1202.0 1202.0 1344.3875 0.0 1344.3875 1344.3875 6.035596 1.7529807 8.973807 3.3102748 -0.08044559 10.904433965682983
|
| 9 |
+
7 1225.0 0.0 1225.0 1225.0 1281.0114 0.0 1281.0114 1281.0114 6.247897 1.968946 9.541765 3.5399778 -0.031752802 12.402732610702515
|
| 10 |
+
8 1236.0 0.0 1236.0 1236.0 1238.743 0.0 1238.743 1238.743 5.89419 1.8811383 9.255002 3.2155774 -0.0015451908 13.89477801322937
|
| 11 |
+
9 1217.0 0.0 1217.0 1217.0 1222.1251 0.0 1222.1251 1222.1251 5.623561 1.9753083 9.158954 2.7347083 -0.0029309243 15.411056995391846
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a25ced2c4ff4f6e6cb51162cb61c5c6c97916c59e86ee7e25aa0b13c75dab767
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 1002.0 0.0 1002.0 1002.0 1070.5034 0.0 1070.5034 1070.5034 0.22323427 0.045061756 0.2803741 0.15546012 -0.06542736 1.5466432571411133
|
| 3 |
+
1 1147.0 0.0 1147.0 1147.0 1222.0647 0.0 1222.0647 1222.0647 4.5255995 0.36485848 4.9482393 3.9306602 -0.046974108 3.071249485015869
|
| 4 |
+
2 1153.0 0.0 1153.0 1153.0 1276.2467 0.0 1276.2467 1276.2467 5.186043 1.427025 7.078469 3.1816862 -0.07731922 4.598511695861816
|
| 5 |
+
3 1146.0 0.0 1146.0 1146.0 1244.5114 0.0 1244.5114 1244.5114 5.5217695 1.9571221 8.18985 2.5215247 -0.06160903 6.129634618759155
|
| 6 |
+
4 1152.0 0.0 1152.0 1152.0 1251.0724 0.0 1251.0724 1251.0724 5.328388 1.8464293 7.959303 2.3591478 -0.06192036 7.659305095672607
|
| 7 |
+
5 1159.0 0.0 1159.0 1159.0 1258.4625 0.0 1258.4625 1258.4625 5.24099 2.155841 8.348679 1.7706525 -0.062163606 9.185559034347534
|
| 8 |
+
6 1176.0 0.0 1176.0 1176.0 1289.4347 0.0 1289.4347 1289.4347 5.3775735 2.177179 8.727808 1.7319336 -0.07094137 10.71433687210083
|
| 9 |
+
7 1161.0 0.0 1161.0 1161.0 1334.8282 0.0 1334.8282 1334.8282 5.579647 2.0350485 8.798765 2.0514455 -0.10864286 12.247443914413452
|
| 10 |
+
8 1177.0 0.0 1177.0 1177.0 1302.4358 0.0 1302.4358 1302.4358 5.961232 1.9984908 9.095709 2.3366942 -0.07839759 13.774472713470459
|
| 11 |
+
9 1176.0 0.0 1176.0 1176.0 1241.5043 0.0 1241.5043 1241.5043 5.6641784 2.2364795 9.267008 1.6431377 -0.04094121 15.301223039627075
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:502445c15f6ace5c920ef6d4e9fff606bc55b5e1875fe2ac2c314b7f5319f773
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=2_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:770168b3aaef05c84af851d3036d265dcee4f037db63d5c1823616342f1a4a47
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 930.0 0.0 930.0 930.0 992.2273 0.0 992.2273 992.2273 0.06651514 0.030768508 0.12862921 0.025994942 -0.06509103 1.7421948909759521
|
| 3 |
+
1 1231.0 0.0 1231.0 1231.0 1232.3569 0.0 1232.3569 1232.3569 4.2291107 0.13509724 4.373209 3.7645724 -0.00067947805 3.4568123817443848
|
| 4 |
+
2 1204.0 0.0 1204.0 1204.0 1288.5216 0.0 1288.5216 1288.5216 5.606352 1.2835276 7.0406475 3.1012685 -0.042260982 5.172529458999634
|
| 5 |
+
3 1206.0 0.0 1206.0 1206.0 1333.481 0.0 1333.481 1333.481 5.9853964 1.4935832 7.929003 3.1565397 -0.06380397 6.842583656311035
|
| 6 |
+
4 1161.0 0.0 1161.0 1161.0 1321.4769 0.0 1321.4769 1321.4769 6.288762 1.6507521 8.739389 3.1553829 -0.08068189 8.510520458221436
|
| 7 |
+
5 1221.0 0.0 1221.0 1221.0 1393.4319 0.0 1393.4319 1393.4319 6.378141 1.4993801 8.714547 3.6088455 -0.086867586 10.186025381088257
|
| 8 |
+
6 1220.0 0.0 1220.0 1220.0 1452.1389 0.0 1452.1389 1452.1389 6.6079187 1.6396201 9.244006 3.6715333 -0.116127804 11.862547636032104
|
| 9 |
+
7 1232.0 0.0 1232.0 1232.0 1366.3013 0.0 1366.3013 1366.3013 6.905231 1.7877018 9.831878 4.039462 -0.06721743 13.5599946975708
|
| 10 |
+
8 1205.0 0.0 1205.0 1205.0 1278.6427 0.0 1278.6427 1278.6427 6.4886374 1.7435365 9.595183 3.6689155 -0.03698823 15.25812029838562
|
| 11 |
+
9 1227.0 0.0 1227.0 1227.0 1305.3923 0.0 1305.3923 1305.3923 6.0412135 1.8536057 9.321296 2.9326897 -0.03919537 16.9726300239563
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d24e32e915146e074b207e0b1fa6f84dd96c4ccc0fa70ee2405ea3a67506e870
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 988.0 0.0 988.0 988.0 1003.2184 0.0 1003.2184 1003.2184 0.2133365 0.042809114 0.27891508 0.15449677 -0.012745604 1.6281647682189941
|
| 3 |
+
1 1170.0 0.0 1170.0 1170.0 1161.4623 0.0 1161.4623 1161.4623 4.220183 0.400415 4.685703 3.3988972 0.00475125 3.246513843536377
|
| 4 |
+
2 1113.0 0.0 1113.0 1113.0 1167.7142 0.0 1167.7142 1167.7142 5.078326 1.2833967 6.7664523 2.9952528 -0.03044796 4.792450428009033
|
| 5 |
+
3 1117.0 0.0 1117.0 1117.0 1140.8434 0.0 1140.8434 1140.8434 5.2304974 1.6317452 7.4960375 2.5677817 -0.013261095 6.334895372390747
|
| 6 |
+
4 1147.0 0.0 1147.0 1147.0 1166.5417 0.0 1166.5417 1166.5417 5.1616526 1.5522047 7.4084687 2.4282608 -0.010880858 7.845405101776123
|
| 7 |
+
5 1141.0 0.0 1141.0 1141.0 1168.0166 0.0 1168.0166 1168.0166 5.138826 1.8236151 7.885619 1.9572355 -0.015017942 9.351108312606812
|
| 8 |
+
6 1156.0 0.0 1156.0 1156.0 1193.2911 0.0 1193.2911 1193.2911 5.23483 1.8714991 8.386953 1.9658835 -0.020728558 10.910987138748169
|
| 9 |
+
7 1113.0 0.0 1113.0 1113.0 1218.3712 0.0 1218.3712 1218.3712 5.4298606 1.7760464 8.481021 2.3338308 -0.058539763 12.693541526794434
|
| 10 |
+
8 1147.0 0.0 1147.0 1147.0 1204.4265 0.0 1204.4265 1204.4265 5.6730704 1.6515126 8.560489 2.7388594 -0.0319214 14.227595567703247
|
| 11 |
+
9 1169.0 0.0 1169.0 1169.0 1152.675 0.0 1152.675 1152.675 5.4589467 1.9669291 8.87189 2.100496 0.009069063 15.759260892868042
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c2a395d0a9ffb629d02abe23c1033cfb74fa6e552b6edd392a815d7bf939520
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=3_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:770168b3aaef05c84af851d3036d265dcee4f037db63d5c1823616342f1a4a47
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 908.0 0.0 908.0 908.0 925.8427 0.0 925.8427 925.8427 0.061079234 0.029705958 0.12747869 0.024436295 -0.019737348 1.6845595836639404
|
| 3 |
+
1 1163.0 0.0 1163.0 1163.0 1082.6565 0.0 1082.6565 1082.6565 3.8942513 0.14911747 4.0687084 3.5044916 0.04630725 3.3590328693389893
|
| 4 |
+
2 1165.0 0.0 1165.0 1165.0 1157.9706 0.0 1157.9706 1157.9706 4.856373 1.1185611 6.2661934 2.994666 0.004775353 5.036845922470093
|
| 5 |
+
3 1193.0 0.0 1193.0 1193.0 1221.1901 0.0 1221.1901 1221.1901 5.3410945 1.3930454 7.257123 2.9381623 -0.021227285 6.598391771316528
|
| 6 |
+
4 1160.0 0.0 1160.0 1160.0 1200.978 0.0 1200.978 1200.978 5.691611 1.5363562 8.079082 2.9929485 -0.035726305 8.134608030319214
|
| 7 |
+
5 1167.0 0.0 1167.0 1167.0 1216.8624 0.0 1216.8624 1216.8624 5.6843405 1.4334729 8.203323 3.2916589 -0.043358482 9.671580076217651
|
| 8 |
+
6 1169.0 0.0 1169.0 1169.0 1261.4766 0.0 1261.4766 1261.4766 5.7206373 1.5606426 8.596225 3.244196 -0.07345247 11.205826759338379
|
| 9 |
+
7 1163.0 0.0 1163.0 1163.0 1198.2916 0.0 1198.2916 1198.2916 5.862975 1.7796805 9.283429 3.3218791 -0.02506505 12.74873685836792
|
| 10 |
+
8 1207.0 0.0 1207.0 1207.0 1196.7089 0.0 1196.7089 1196.7089 5.5816116 1.6990546 9.147678 3.0907478 0.0077963695 14.318079948425293
|
| 11 |
+
9 1196.0 0.0 1196.0 1196.0 1187.7532 0.0 1187.7532 1187.7532 5.5002346 1.5639231 8.950281 3.188693 0.005648352 16.10502529144287
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:542de518ac08ce56985b150774a65d60d28a083aed67723ac84613fe17d4bfa3
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f946fe6c9a728a7abe8d3928ea8cd68bcfcb39b4de86e58100105f2db062d6
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 996.0 0.0 996.0 996.0 1042.4347 0.0 1042.4347 1042.4347 0.2230201 0.044851135 0.27978066 0.15507168 -0.043930635 1.5171842575073242
|
| 3 |
+
1 1152.0 0.0 1152.0 1152.0 1196.2231 0.0 1196.2231 1196.2231 4.0933585 0.274151 4.457058 3.646826 -0.027657494 3.019925117492676
|
| 4 |
+
2 1119.0 0.0 1119.0 1119.0 1214.9153 0.0 1214.9153 1214.9153 4.7705784 1.2670809 6.8144627 3.2446218 -0.06136644 4.522210597991943
|
| 5 |
+
3 1119.0 0.0 1119.0 1119.0 1186.1375 0.0 1186.1375 1186.1375 5.1090803 1.3264626 7.5319605 3.382184 -0.04196024 6.0225465297698975
|
| 6 |
+
4 1145.0 0.0 1145.0 1145.0 1211.3746 0.0 1211.3746 1211.3746 5.119468 1.2100283 7.495699 3.4305665 -0.04148437 7.527385234832764
|
| 7 |
+
5 1138.0 0.0 1138.0 1138.0 1205.8164 0.0 1205.8164 1205.8164 5.169105 1.4672385 8.194489 3.084612 -0.04241173 9.02845573425293
|
| 8 |
+
6 1143.0 0.0 1143.0 1143.0 1222.9315 0.0 1222.9315 1222.9315 5.141478 1.5491165 8.808318 3.202721 -0.04998894 10.53096079826355
|
| 9 |
+
7 1148.0 0.0 1148.0 1148.0 1290.3949 0.0 1290.3949 1290.3949 5.206814 1.4783621 8.751904 3.565569 -0.08899681 12.03333592414856
|
| 10 |
+
8 1164.0 0.0 1164.0 1164.0 1258.1008 0.0 1258.1008 1258.1008 5.7222023 1.4749635 9.2217655 4.0578647 -0.058886528 13.533396244049072
|
| 11 |
+
9 1152.0 0.0 1152.0 1152.0 1185.0465 0.0 1185.0465 1185.0465 5.5298553 1.65695 9.349673 3.5494692 -0.020718813 15.03360891342163
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8841f5982c2075b2b95eb57d617e63fe7ed7a64ef429c4b1a6049258bc550d92
|
| 3 |
+
size 26198
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=4_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s13/vars.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:770168b3aaef05c84af851d3036d265dcee4f037db63d5c1823616342f1a4a47
|
| 3 |
+
size 13916
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=5_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=5_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/progress.txt
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time
|
| 2 |
+
0 933.0 0.0 933.0 933.0 972.8293 0.0 972.8293 972.8293 0.060133453 0.028405845 0.11186355 0.025366038 -0.046748422 1.5428578853607178
|
| 3 |
+
1 1151.0 0.0 1151.0 1151.0 1124.7109 0.0 1124.7109 1124.7109 3.991683 0.14392135 4.1472416 3.6653965 0.014662422 3.1322968006134033
|
| 4 |
+
2 1136.0 0.0 1136.0 1136.0 1178.2677 0.0 1178.2677 1178.2677 4.8533726 1.0239773 6.062337 3.23256 -0.023481652 4.75055718421936
|
| 5 |
+
3 1144.0 0.0 1144.0 1144.0 1240.7239 0.0 1240.7239 1240.7239 5.2947874 1.3103068 6.942222 3.1439362 -0.0537657 6.362165689468384
|
| 6 |
+
4 1118.0 0.0 1118.0 1118.0 1234.6378 0.0 1234.6378 1234.6378 5.6339197 1.3796512 7.5465717 3.176712 -0.0647982 7.969565391540527
|
| 7 |
+
5 1160.0 0.0 1160.0 1160.0 1297.3956 0.0 1297.3956 1297.3956 5.7473044 1.272676 7.6536417 3.438048 -0.07637345 9.57076358795166
|
| 8 |
+
6 1135.0 0.0 1135.0 1135.0 1324.5988 0.0 1324.5988 1324.5988 6.0181847 1.3489273 8.172247 3.5578313 -0.10533208 11.170955181121826
|
| 9 |
+
7 1161.0 0.0 1161.0 1161.0 1258.4978 0.0 1258.4978 1258.4978 6.210946 1.4776 8.68286 3.811021 -0.054165907 12.769633293151855
|
| 10 |
+
8 1142.0 0.0 1142.0 1142.0 1181.2092 0.0 1181.2092 1181.2092 5.8233175 1.444846 8.582061 3.3962119 -0.021783322 14.362510204315186
|
| 11 |
+
9 1159.0 0.0 1159.0 1159.0 1207.5348 0.0 1207.5348 1207.5348 5.3827343 1.5257895 8.313026 2.7265518 -0.026963346 15.95551872253418
|
reward_1707780024.4380288_rfbase_cotTrue_task_index=5_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707780024.4380288_rfbase_cotTrue_task_index=5_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s12/pyt_save/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:110807ff0011316c829c91837112ce924b1c99c8e3614b4eb1c83f6629b4d797
|
| 3 |
+
size 26198
|