Bram Vanroy committed on
Commit
e6a7a63
1 Parent(s): 4228cee

add first Tower

Browse files
evals/arc/arc_nl_TowerBase-7B-v0.1.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "arc_nl": {
4
+ "acc": 0.358426005132592,
5
+ "acc_stderr": 0.01403142278327522,
6
+ "acc_norm": 0.3721129170230967,
7
+ "acc_norm_stderr": 0.014143494499252762
8
+ }
9
+ },
10
+ "versions": {
11
+ "arc_nl": 0
12
+ },
13
+ "config": {
14
+ "model": "hf-auto",
15
+ "model_args": "pretrained=Unbabel/TowerBase-7B-v0.1,use_accelerate=True,device_map_option=auto,dtype=auto,load_in_8bit=True",
16
+ "batch_size": 4,
17
+ "device": "cuda",
18
+ "no_cache": false,
19
+ "limit": null,
20
+ "bootstrap_iters": 100000,
21
+ "description_dict": {}
22
+ }
23
+ }
evals/arc/arc_nl_TowerInstruct-7B-v0.1.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "arc_nl": {
4
+ "acc": 0.3900769888793841,
5
+ "acc_stderr": 0.014272210869539614,
6
+ "acc_norm": 0.3943541488451668,
7
+ "acc_norm_stderr": 0.014299839367505047
8
+ }
9
+ },
10
+ "versions": {
11
+ "arc_nl": 0
12
+ },
13
+ "config": {
14
+ "model": "hf-auto",
15
+ "model_args": "pretrained=Unbabel/TowerInstruct-7B-v0.1,use_accelerate=True,device_map_option=auto,dtype=auto,load_in_8bit=True",
16
+ "batch_size": 4,
17
+ "device": "cuda",
18
+ "no_cache": false,
19
+ "limit": null,
20
+ "bootstrap_iters": 100000,
21
+ "description_dict": {}
22
+ }
23
+ }
evals/hellaswag/hellaswag_nl_TowerBase-7B-v0.1.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "hellaswag_nl": {
4
+ "acc": 0.4561252023745278,
5
+ "acc_stderr": 0.005174784023983772,
6
+ "acc_norm": 0.5817593092282785,
7
+ "acc_norm_stderr": 0.005124901694100509
8
+ }
9
+ },
10
+ "versions": {
11
+ "hellaswag_nl": 1
12
+ },
13
+ "config": {
14
+ "model": "hf-auto",
15
+ "model_args": "pretrained=Unbabel/TowerBase-7B-v0.1,use_accelerate=True,device_map_option=auto,dtype=auto,load_in_8bit=True",
16
+ "batch_size": 4,
17
+ "device": "cuda",
18
+ "no_cache": false,
19
+ "limit": null,
20
+ "bootstrap_iters": 100000,
21
+ "description_dict": {}
22
+ }
23
+ }
evals/hellaswag/hellaswag_nl_TowerInstruct-7B-v0.1.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "hellaswag_nl": {
4
+ "acc": 0.471127900701565,
5
+ "acc_stderr": 0.005186154697710561,
6
+ "acc_norm": 0.5960064759848893,
7
+ "acc_norm_stderr": 0.005098159491383791
8
+ }
9
+ },
10
+ "versions": {
11
+ "hellaswag_nl": 1
12
+ },
13
+ "config": {
14
+ "model": "hf-auto",
15
+ "model_args": "pretrained=Unbabel/TowerInstruct-7B-v0.1,use_accelerate=True,device_map_option=auto,dtype=auto,load_in_8bit=True",
16
+ "batch_size": 4,
17
+ "device": "cuda",
18
+ "no_cache": false,
19
+ "limit": null,
20
+ "bootstrap_iters": 100000,
21
+ "description_dict": {}
22
+ }
23
+ }
evals/models.json CHANGED
@@ -143,6 +143,22 @@
143
  "num_parameters": 2779683840,
144
  "quantization": "8-bit"
145
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
146
  "yi-6b": {
147
  "compute_dtype": "auto",
148
  "dutch_coverage": "none",
 
143
  "num_parameters": 2779683840,
144
  "quantization": "8-bit"
145
  },
146
+ "towerbase-7b-v0.1": {
147
+ "compute_dtype": "auto",
148
+ "dutch_coverage": "not-given",
149
+ "model_name": "Unbabel/TowerBase-7B-v0.1",
150
+ "model_type": "not-given",
151
+ "num_parameters": 6738415616,
152
+ "quantization": "8-bit"
153
+ },
154
+ "towerinstruct-7b-v0.1": {
155
+ "compute_dtype": "auto",
156
+ "dutch_coverage": "not-given",
157
+ "model_name": "Unbabel/TowerInstruct-7B-v0.1",
158
+ "model_type": "not-given",
159
+ "num_parameters": 6738472960,
160
+ "quantization": "8-bit"
161
+ },
162
  "yi-6b": {
163
  "compute_dtype": "auto",
164
  "dutch_coverage": "none",
evals/truthfulqa/truthfulqa_nl_TowerBase-7B-v0.1.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "truthfulqa_nl": {
4
+ "mc1": 0.25987261146496815,
5
+ "mc1_stderr": 0.015663018533664023,
6
+ "mc2": 0.409372470832061,
7
+ "mc2_stderr": 0.014507968477947334
8
+ }
9
+ },
10
+ "versions": {
11
+ "truthfulqa_nl": 1
12
+ },
13
+ "config": {
14
+ "model": "hf-auto",
15
+ "model_args": "pretrained=Unbabel/TowerBase-7B-v0.1,use_accelerate=True,device_map_option=auto,dtype=auto,load_in_8bit=True",
16
+ "batch_size": 4,
17
+ "device": "cuda",
18
+ "no_cache": false,
19
+ "limit": null,
20
+ "bootstrap_iters": 100000,
21
+ "description_dict": {}
22
+ }
23
+ }
evals/truthfulqa/truthfulqa_nl_TowerInstruct-7B-v0.1.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "truthfulqa_nl": {
4
+ "mc1": 0.30318471337579617,
5
+ "mc1_stderr": 0.01641551278171108,
6
+ "mc2": 0.4474541407756634,
7
+ "mc2_stderr": 0.01525070581914585
8
+ }
9
+ },
10
+ "versions": {
11
+ "truthfulqa_nl": 1
12
+ },
13
+ "config": {
14
+ "model": "hf-auto",
15
+ "model_args": "pretrained=Unbabel/TowerInstruct-7B-v0.1,use_accelerate=True,device_map_option=auto,dtype=auto,load_in_8bit=True",
16
+ "batch_size": 4,
17
+ "device": "cuda",
18
+ "no_cache": false,
19
+ "limit": null,
20
+ "bootstrap_iters": 100000,
21
+ "description_dict": {}
22
+ }
23
+ }