meg HF staff committed on
Commit
d44c767
·
verified ·
1 Parent(s): 270efc6

Upload folder using huggingface_hub

Browse files
teaching_arithmetic/out/addition_plain/addition_plain/config.yaml CHANGED
@@ -71,8 +71,8 @@ use_lora: false
71
  val_data_path: val.bin
72
  val_data_path2: val_addition.bin
73
  vocabulary: all_ascii_chars
74
- wandb_entity: ssdd
75
- wandb_log: false
76
  wandb_project: addition
77
  wandb_run_name: addition_plain
78
  warmup_iters: 100
 
71
  val_data_path: val.bin
72
  val_data_path2: val_addition.bin
73
  vocabulary: all_ascii_chars
74
+ wandb_entity: ''
75
+ wandb_log: true
76
  wandb_project: addition
77
  wandb_run_name: addition_plain
78
  warmup_iters: 100
teaching_arithmetic/out/addition_plain/addition_plain/result.csv CHANGED
@@ -1,22 +1,22 @@
1
  iter,train_loss,val_loss,val_ppl,test_acc,train_acc,test_acc_ar,test_acc_other
2
  0,4.558201789855957,4.557050704956055,,0.0,0.0,,
3
- 250,1.7286615371704102,1.7170720100402832,,0.0707070707070707,0.16999999999999998,,
4
- 500,1.4398878812789917,1.4310863018035889,,5.434343434343434,5.96,,
5
- 750,1.2331775426864624,1.2203372716903687,,73.54545454545455,67.83,,
6
- 1000,1.1358768939971924,1.2272201776504517,,75.29292929292929,70.32000000000001,,
7
- 1250,0.5539495348930359,1.7250535488128662,,77.78787878787878,73.18,,
8
- 1500,0.1001376137137413,2.863405227661133,,78.0,74.55000000000001,,
9
- 1750,0.07596367597579956,3.4369161128997803,,78.83838383838383,77.46,,
10
- 2000,0.06951306015253067,3.724381685256958,,78.57575757575758,78.39,,
11
- 2250,0.06603887677192688,3.890638828277588,,79.06060606060606,78.68,,
12
- 2500,0.06290150433778763,3.9894931316375732,,79.94949494949495,82.75,,
13
- 2750,0.06049436703324318,4.099140167236328,,80.77777777777779,81.78,,
14
- 3000,0.05838387832045555,4.249746322631836,,80.53535353535354,83.32000000000001,,
15
- 3250,0.057155631482601166,4.353604316711426,,81.17171717171718,83.25,,
16
- 3500,0.055782441049814224,4.412276268005371,,81.0,83.96000000000001,,
17
- 3750,0.054552655667066574,4.499052047729492,,81.4040404040404,84.98,,
18
- 4000,0.053756218403577805,4.524080276489258,,80.96969696969697,85.02,,
19
- 4250,0.05292206257581711,4.601434707641602,,81.5050505050505,84.89,,
20
- 4500,0.052253320813179016,4.638243675231934,,81.73737373737374,85.17,,
21
- 4750,0.0518411286175251,4.682107448577881,,81.43434343434343,85.61,,
22
- 5000,0.051410287618637085,4.731619358062744,,81.51515151515152,86.03,,
 
1
  iter,train_loss,val_loss,val_ppl,test_acc,train_acc,test_acc_ar,test_acc_other
2
  0,4.558201789855957,4.557050704956055,,0.0,0.0,,
3
+ 250,1.727452039718628,1.7128900289535522,,0.09090909090909091,0.21,,
4
+ 500,1.3982913494110107,1.4006158113479614,,6.424242424242424,7.04,,
5
+ 750,1.2016884088516235,1.2032077312469482,,61.84848484848485,56.75,,
6
+ 1000,1.1120785474777222,1.201298475265503,,78.11111111111111,75.41,,
7
+ 1250,0.510977029800415,1.6772781610488892,,83.98989898989899,79.85,,
8
+ 1500,0.08414328843355179,3.0158331394195557,,85.12121212121212,81.81,,
9
+ 1750,0.07066360116004944,3.628917932510376,,86.67676767676767,83.46000000000001,,
10
+ 2000,0.06547190994024277,3.9166698455810547,,87.80808080808082,84.76,,
11
+ 2250,0.0619925819337368,4.123533725738525,,87.43434343434343,84.71,,
12
+ 2500,0.059753164649009705,4.269007205963135,,87.5050505050505,86.29,,
13
+ 2750,0.05738186836242676,4.358820915222168,,88.01010101010101,86.11,,
14
+ 3000,0.055332522839307785,4.551158905029297,,88.05050505050505,86.55000000000001,,
15
+ 3250,0.05387099087238312,4.602115631103516,,87.72727272727273,85.84,,
16
+ 3500,0.05256320536136627,4.660210609436035,,87.70707070707071,85.7,,
17
+ 3750,0.05127747356891632,4.75046443939209,,88.24242424242425,86.33,,
18
+ 4000,0.05036056414246559,4.851500511169434,,87.98989898989899,87.08,,
19
+ 4250,0.049514856189489365,4.912571907043457,,88.22222222222223,86.94,,
20
+ 4500,0.04892862215638161,4.902630805969238,,88.28282828282829,87.07000000000001,,
21
+ 4750,0.04843810200691223,4.9761247634887695,,88.35353535353535,87.5,,
22
+ 5000,0.048013366758823395,5.004452228546143,,88.20202020202021,87.11,,
teaching_arithmetic/out/addition_plain/ckpt_10000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b6e21682cc49d528b55dd0b7569ffedb9f5a259f20fb30faddc983c6cfedf05
3
  size 129138715
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91a33d4ed5ed61168a720418fc42627611b7dde6bcf5fe6c405cb54435261319
3
  size 129138715
teaching_arithmetic/out/addition_plain/ckpt_10000_acc.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac751f03da9a54a32944b82532d2530352c89f6e23e7f53c5933c4697b29e685
3
  size 129139359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f72ed2793d7d45dc5e8c1743e557aa75ff44bd7fafd94229dfa00e6fd956271
3
  size 129139359
teaching_arithmetic/out/addition_plain/ckpt_10000_final.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b02d470faa1df8f459c2b19670e716be7f44db1a4243b604585ce57648f1c94e
3
  size 129139681
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:935c8a7654c307c1b6cdf68d6b6686f70eaa04b2bde08c15ebaa1427bda51601
3
  size 129139681