cfierro committed on
Commit
0f7dfab
·
verified ·
1 Parent(s): 0f1df42

Add attn knockout, now including last_subj_token

Browse files
Files changed (22) hide show
  1. attn_knockout/facebook__xglm-7.5B/ar_subset_resample_trivial_window=6/args.json +12 -0
  2. attn_knockout/facebook__xglm-7.5B/ar_subset_resample_trivial_window=6/results.csv +3 -0
  3. attn_knockout/facebook__xglm-7.5B/en_subset_resample_trivial_window=6/args.json +12 -0
  4. attn_knockout/facebook__xglm-7.5B/en_subset_resample_trivial_window=6/results.csv +3 -0
  5. attn_knockout/facebook__xglm-7.5B/es_subset_resample_trivial_window=6/args.json +12 -0
  6. attn_knockout/facebook__xglm-7.5B/es_subset_resample_trivial_window=6/results.csv +3 -0
  7. attn_knockout/facebook__xglm-7.5B/fa_subset_resample_trivial_window=6/args.json +12 -0
  8. attn_knockout/facebook__xglm-7.5B/fa_subset_resample_trivial_window=6/results.csv +0 -0
  9. attn_knockout/facebook__xglm-7.5B/he_subset_resample_trivial_window=6/args.json +12 -0
  10. attn_knockout/facebook__xglm-7.5B/he_subset_resample_trivial_window=6/results.csv +0 -0
  11. attn_knockout/facebook__xglm-7.5B/ja_subset_resample_trivial_window=6/args.json +12 -0
  12. attn_knockout/facebook__xglm-7.5B/ja_subset_resample_trivial_window=6/results.csv +0 -0
  13. attn_knockout/facebook__xglm-7.5B/ko_subset_resample_trivial_window=6/args.json +12 -0
  14. attn_knockout/facebook__xglm-7.5B/ko_subset_resample_trivial_window=6/results.csv +0 -0
  15. attn_knockout/facebook__xglm-7.5B/ru_subset_resample_trivial_window=6/args.json +12 -0
  16. attn_knockout/facebook__xglm-7.5B/ru_subset_resample_trivial_window=6/results.csv +3 -0
  17. attn_knockout/facebook__xglm-7.5B/tr_subset_resample_trivial_window=6/args.json +12 -0
  18. attn_knockout/facebook__xglm-7.5B/tr_subset_resample_trivial_window=6/results.csv +0 -0
  19. attn_knockout/facebook__xglm-7.5B/uk_subset_resample_trivial_window=6/args.json +12 -0
  20. attn_knockout/facebook__xglm-7.5B/uk_subset_resample_trivial_window=6/results.csv +0 -0
  21. attn_knockout/facebook__xglm-7.5B/vi_subset_resample_trivial_window=6/args.json +12 -0
  22. attn_knockout/facebook__xglm-7.5B/vi_subset_resample_trivial_window=6/results.csv +3 -0
attn_knockout/facebook__xglm-7.5B/ar_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "ar",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/ar_subset_resample_trivial_window=6/results.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67793a7370f5cb51dfd640b5b48a64f8b06810924f082394d1f725fad33697db
3
+ size 15857234
attn_knockout/facebook__xglm-7.5B/en_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "en",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/en_subset_resample_trivial_window=6/results.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:642c065f15bb506a66d66d508aa0718ee265e88307a066255dffda36645355dd
3
+ size 17064336
attn_knockout/facebook__xglm-7.5B/es_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "es",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/es_subset_resample_trivial_window=6/results.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:610c8fb2f9657abf59e8eb86dbc9878f844aabee4ae58a5a7db7f8fb187be315
3
+ size 17196429
attn_knockout/facebook__xglm-7.5B/fa_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "fa",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/fa_subset_resample_trivial_window=6/results.csv ADDED
The diff for this file is too large to render. See raw diff
 
attn_knockout/facebook__xglm-7.5B/he_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "he",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/he_subset_resample_trivial_window=6/results.csv ADDED
The diff for this file is too large to render. See raw diff
 
attn_knockout/facebook__xglm-7.5B/ja_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "ja",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/ja_subset_resample_trivial_window=6/results.csv ADDED
The diff for this file is too large to render. See raw diff
 
attn_knockout/facebook__xglm-7.5B/ko_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "ko",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/ko_subset_resample_trivial_window=6/results.csv ADDED
The diff for this file is too large to render. See raw diff
 
attn_knockout/facebook__xglm-7.5B/ru_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "ru",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/ru_subset_resample_trivial_window=6/results.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194b10a2fa7b6423492c1eb539b48d5411d6227a619df77d7ab94226f5fcf8ff
3
+ size 17127120
attn_knockout/facebook__xglm-7.5B/tr_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "tr",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/tr_subset_resample_trivial_window=6/results.csv ADDED
The diff for this file is too large to render. See raw diff
 
attn_knockout/facebook__xglm-7.5B/uk_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "uk",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/uk_subset_resample_trivial_window=6/results.csv ADDED
The diff for this file is too large to render. See raw diff
 
attn_knockout/facebook__xglm-7.5B/vi_subset_resample_trivial_window=6/args.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name_or_path": "facebook/xglm-7.5B",
3
+ "model_name": "facebook__xglm-7.5B",
4
+ "output_folder": "/projects/nlp/data/constanzam/cross_fact/attn_knockout",
5
+ "eval_dir": "/projects/nlp/data/constanzam/cross_fact/eval/",
6
+ "language": "vi",
7
+ "only_subset": true,
8
+ "filter_trivial": true,
9
+ "keep_only_trivial": false,
10
+ "resample_trivial": true,
11
+ "patch_k_layers": 6
12
+ }
attn_knockout/facebook__xglm-7.5B/vi_subset_resample_trivial_window=6/results.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:052506116b5c66a4726bc8ffb5c27a7b65cb68356fa199187e5293e184e16fb6
3
+ size 18125907