Upload folder using huggingface_hub
Browse files- teaching_arithmetic/out/addition_plain/addition_plain/config.yaml +2 -2
- teaching_arithmetic/out/addition_plain/addition_plain/result.csv +20 -20
- teaching_arithmetic/out/addition_plain/ckpt_10000.pt +1 -1
- teaching_arithmetic/out/addition_plain/ckpt_10000_acc.pt +1 -1
- teaching_arithmetic/out/addition_plain/ckpt_10000_final.pt +1 -1
teaching_arithmetic/out/addition_plain/addition_plain/config.yaml
CHANGED
@@ -71,8 +71,8 @@ use_lora: false
|
|
71 |
val_data_path: val.bin
|
72 |
val_data_path2: val_addition.bin
|
73 |
vocabulary: all_ascii_chars
|
74 |
-
wandb_entity:
|
75 |
-
wandb_log:
|
76 |
wandb_project: addition
|
77 |
wandb_run_name: addition_plain
|
78 |
warmup_iters: 100
|
|
|
71 |
val_data_path: val.bin
|
72 |
val_data_path2: val_addition.bin
|
73 |
vocabulary: all_ascii_chars
|
74 |
+
wandb_entity: ''
|
75 |
+
wandb_log: true
|
76 |
wandb_project: addition
|
77 |
wandb_run_name: addition_plain
|
78 |
warmup_iters: 100
|
teaching_arithmetic/out/addition_plain/addition_plain/result.csv
CHANGED
@@ -1,22 +1,22 @@
|
|
1 |
iter,train_loss,val_loss,val_ppl,test_acc,train_acc,test_acc_ar,test_acc_other
|
2 |
0,4.558201789855957,4.557050704956055,,0.0,0.0,,
|
3 |
-
250,1.
|
4 |
-
500,1.
|
5 |
-
750,1.
|
6 |
-
1000,1.
|
7 |
-
1250,0.
|
8 |
-
1500,0.
|
9 |
-
1750,0.
|
10 |
-
2000,0.
|
11 |
-
2250,0.
|
12 |
-
2500,0.
|
13 |
-
2750,0.
|
14 |
-
3000,0.
|
15 |
-
3250,0.
|
16 |
-
3500,0.
|
17 |
-
3750,0.
|
18 |
-
4000,0.
|
19 |
-
4250,0.
|
20 |
-
4500,0.
|
21 |
-
4750,0.
|
22 |
-
5000,0.
|
|
|
1 |
iter,train_loss,val_loss,val_ppl,test_acc,train_acc,test_acc_ar,test_acc_other
|
2 |
0,4.558201789855957,4.557050704956055,,0.0,0.0,,
|
3 |
+
250,1.727452039718628,1.7128900289535522,,0.09090909090909091,0.21,,
|
4 |
+
500,1.3982913494110107,1.4006158113479614,,6.424242424242424,7.04,,
|
5 |
+
750,1.2016884088516235,1.2032077312469482,,61.84848484848485,56.75,,
|
6 |
+
1000,1.1120785474777222,1.201298475265503,,78.11111111111111,75.41,,
|
7 |
+
1250,0.510977029800415,1.6772781610488892,,83.98989898989899,79.85,,
|
8 |
+
1500,0.08414328843355179,3.0158331394195557,,85.12121212121212,81.81,,
|
9 |
+
1750,0.07066360116004944,3.628917932510376,,86.67676767676767,83.46000000000001,,
|
10 |
+
2000,0.06547190994024277,3.9166698455810547,,87.80808080808082,84.76,,
|
11 |
+
2250,0.0619925819337368,4.123533725738525,,87.43434343434343,84.71,,
|
12 |
+
2500,0.059753164649009705,4.269007205963135,,87.5050505050505,86.29,,
|
13 |
+
2750,0.05738186836242676,4.358820915222168,,88.01010101010101,86.11,,
|
14 |
+
3000,0.055332522839307785,4.551158905029297,,88.05050505050505,86.55000000000001,,
|
15 |
+
3250,0.05387099087238312,4.602115631103516,,87.72727272727273,85.84,,
|
16 |
+
3500,0.05256320536136627,4.660210609436035,,87.70707070707071,85.7,,
|
17 |
+
3750,0.05127747356891632,4.75046443939209,,88.24242424242425,86.33,,
|
18 |
+
4000,0.05036056414246559,4.851500511169434,,87.98989898989899,87.08,,
|
19 |
+
4250,0.049514856189489365,4.912571907043457,,88.22222222222223,86.94,,
|
20 |
+
4500,0.04892862215638161,4.902630805969238,,88.28282828282829,87.07000000000001,,
|
21 |
+
4750,0.04843810200691223,4.9761247634887695,,88.35353535353535,87.5,,
|
22 |
+
5000,0.048013366758823395,5.004452228546143,,88.20202020202021,87.11,,
|
teaching_arithmetic/out/addition_plain/ckpt_10000.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 129138715
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91a33d4ed5ed61168a720418fc42627611b7dde6bcf5fe6c405cb54435261319
|
3 |
size 129138715
|
teaching_arithmetic/out/addition_plain/ckpt_10000_acc.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 129139359
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f72ed2793d7d45dc5e8c1743e557aa75ff44bd7fafd94229dfa00e6fd956271
|
3 |
size 129139359
|
teaching_arithmetic/out/addition_plain/ckpt_10000_final.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 129139681
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:935c8a7654c307c1b6cdf68d6b6686f70eaa04b2bde08c15ebaa1427bda51601
|
3 |
size 129139681
|