Tristan committed on
Commit
ffd7d36
1 Parent(s): 0aea66e

Training in progress, epoch 0

Browse files
eval_job_output.txt CHANGED
@@ -1,4 +1,4 @@
1
- slurm submission log: 2024-05-19 09:14:41.870170
2
  created following sbatch script:
3
 
4
  ###############################
@@ -7,13 +7,13 @@ created following sbatch script:
7
 
8
  #SBATCH --account=nlp
9
  #SBATCH --cpus-per-task=16
10
- #SBATCH --dependency=afterok:7631089
11
  #SBATCH --gres=gpu:1
12
- #SBATCH --job-name=tthrush-job-4203243
13
  #SBATCH --mem=60G
14
  #SBATCH --nodelist=sphinx2
15
  #SBATCH --open-mode=append
16
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/eval_job_output.txt
17
  #SBATCH --partition=sphinx
18
  #SBATCH --time=14-0
19
 
@@ -24,7 +24,7 @@ created following sbatch script:
24
  cd .
25
 
26
  # launch commands
27
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/perf'
28
 
29
  ###############################
30
 
@@ -34,13 +34,13 @@ submission to slurm complete!
34
  ###############################
35
  slurm submission output
36
 
37
- Submitted batch job 7631090
38
 
39
 
40
 
41
  ###############################
42
 
43
- slurm submission log: 2024-05-19 09:16:21.073119
44
  created following sbatch script:
45
 
46
  ###############################
@@ -49,13 +49,13 @@ created following sbatch script:
49
 
50
  #SBATCH --account=nlp
51
  #SBATCH --cpus-per-task=16
52
- #SBATCH --dependency=afterok:7631150
53
  #SBATCH --gres=gpu:1
54
- #SBATCH --job-name=tthrush-job-3010961
55
  #SBATCH --mem=60G
56
  #SBATCH --nodelist=sphinx2
57
  #SBATCH --open-mode=append
58
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/eval_job_output.txt
59
  #SBATCH --partition=sphinx
60
  #SBATCH --time=14-0
61
 
@@ -66,7 +66,7 @@ created following sbatch script:
66
  cd .
67
 
68
  # launch commands
69
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/perf'
70
 
71
  ###############################
72
 
@@ -76,13 +76,13 @@ submission to slurm complete!
76
  ###############################
77
  slurm submission output
78
 
79
- Submitted batch job 7631151
80
 
81
 
82
 
83
  ###############################
84
 
85
- slurm submission log: 2024-05-19 09:25:08.396129
86
  created following sbatch script:
87
 
88
  ###############################
@@ -91,13 +91,13 @@ created following sbatch script:
91
 
92
  #SBATCH --account=nlp
93
  #SBATCH --cpus-per-task=16
94
- #SBATCH --dependency=afterok:7631221
95
  #SBATCH --gres=gpu:1
96
- #SBATCH --job-name=tthrush-job-4399372
97
  #SBATCH --mem=60G
98
  #SBATCH --nodelist=sphinx2
99
  #SBATCH --open-mode=append
100
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/eval_job_output.txt
101
  #SBATCH --partition=sphinx
102
  #SBATCH --time=14-0
103
 
@@ -108,7 +108,7 @@ created following sbatch script:
108
  cd .
109
 
110
  # launch commands
111
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/perf'
112
 
113
  ###############################
114
 
@@ -118,13 +118,13 @@ submission to slurm complete!
118
  ###############################
119
  slurm submission output
120
 
121
- Submitted batch job 7631222
122
 
123
 
124
 
125
  ###############################
126
 
127
- slurm submission log: 2024-05-19 09:27:21.404018
128
  created following sbatch script:
129
 
130
  ###############################
@@ -133,13 +133,13 @@ created following sbatch script:
133
 
134
  #SBATCH --account=nlp
135
  #SBATCH --cpus-per-task=16
136
- #SBATCH --dependency=afterok:7631284
137
  #SBATCH --gres=gpu:1
138
- #SBATCH --job-name=tthrush-job-1884627
139
  #SBATCH --mem=60G
140
  #SBATCH --nodelist=sphinx2
141
  #SBATCH --open-mode=append
142
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/eval_job_output.txt
143
  #SBATCH --partition=sphinx
144
  #SBATCH --time=14-0
145
 
@@ -150,7 +150,7 @@ created following sbatch script:
150
  cd .
151
 
152
  # launch commands
153
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/perf'
154
 
155
  ###############################
156
 
@@ -160,13 +160,13 @@ submission to slurm complete!
160
  ###############################
161
  slurm submission output
162
 
163
- Submitted batch job 7631285
164
 
165
 
166
 
167
  ###############################
168
 
169
- slurm submission log: 2024-05-19 09:28:18.004148
170
  created following sbatch script:
171
 
172
  ###############################
@@ -175,13 +175,13 @@ created following sbatch script:
175
 
176
  #SBATCH --account=nlp
177
  #SBATCH --cpus-per-task=16
178
- #SBATCH --dependency=afterok:7631348
179
  #SBATCH --gres=gpu:1
180
- #SBATCH --job-name=tthrush-job-1636654
181
  #SBATCH --mem=60G
182
  #SBATCH --nodelist=sphinx2
183
  #SBATCH --open-mode=append
184
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/eval_job_output.txt
185
  #SBATCH --partition=sphinx
186
  #SBATCH --time=14-0
187
 
@@ -192,7 +192,7 @@ created following sbatch script:
192
  cd .
193
 
194
  # launch commands
195
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/perf'
196
 
197
  ###############################
198
 
@@ -202,13 +202,13 @@ submission to slurm complete!
202
  ###############################
203
  slurm submission output
204
 
205
- Submitted batch job 7631349
206
 
207
 
208
 
209
  ###############################
210
 
211
- slurm submission log: 2024-05-19 09:29:20.681949
212
  created following sbatch script:
213
 
214
  ###############################
@@ -217,13 +217,13 @@ created following sbatch script:
217
 
218
  #SBATCH --account=nlp
219
  #SBATCH --cpus-per-task=16
220
- #SBATCH --dependency=afterok:7631409
221
  #SBATCH --gres=gpu:1
222
- #SBATCH --job-name=tthrush-job-2759412
223
  #SBATCH --mem=60G
224
  #SBATCH --nodelist=sphinx2
225
  #SBATCH --open-mode=append
226
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/eval_job_output.txt
227
  #SBATCH --partition=sphinx
228
  #SBATCH --time=14-0
229
 
@@ -234,7 +234,7 @@ created following sbatch script:
234
  cd .
235
 
236
  # launch commands
237
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/perf'
238
 
239
  ###############################
240
 
@@ -244,13 +244,13 @@ submission to slurm complete!
244
  ###############################
245
  slurm submission output
246
 
247
- Submitted batch job 7631410
248
 
249
 
250
 
251
  ###############################
252
 
253
- slurm submission log: 2024-05-19 09:30:34.292755
254
  created following sbatch script:
255
 
256
  ###############################
@@ -259,13 +259,13 @@ created following sbatch script:
259
 
260
  #SBATCH --account=nlp
261
  #SBATCH --cpus-per-task=16
262
- #SBATCH --dependency=afterok:7631469
263
  #SBATCH --gres=gpu:1
264
- #SBATCH --job-name=tthrush-job-4781467
265
  #SBATCH --mem=60G
266
  #SBATCH --nodelist=sphinx2
267
  #SBATCH --open-mode=append
268
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/eval_job_output.txt
269
  #SBATCH --partition=sphinx
270
  #SBATCH --time=14-0
271
 
@@ -276,7 +276,7 @@ created following sbatch script:
276
  cd .
277
 
278
  # launch commands
279
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/perf'
280
 
281
  ###############################
282
 
@@ -286,13 +286,13 @@ submission to slurm complete!
286
  ###############################
287
  slurm submission output
288
 
289
- Submitted batch job 7631470
290
 
291
 
292
 
293
  ###############################
294
 
295
- slurm submission log: 2024-05-19 09:31:39.869529
296
  created following sbatch script:
297
 
298
  ###############################
@@ -301,13 +301,13 @@ created following sbatch script:
301
 
302
  #SBATCH --account=nlp
303
  #SBATCH --cpus-per-task=16
304
- #SBATCH --dependency=afterok:7631529
305
  #SBATCH --gres=gpu:1
306
- #SBATCH --job-name=tthrush-job-2913641
307
  #SBATCH --mem=60G
308
  #SBATCH --nodelist=sphinx2
309
  #SBATCH --open-mode=append
310
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/eval_job_output.txt
311
  #SBATCH --partition=sphinx
312
  #SBATCH --time=14-0
313
 
@@ -318,7 +318,7 @@ created following sbatch script:
318
  cd .
319
 
320
  # launch commands
321
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/perf'
322
 
323
  ###############################
324
 
@@ -328,13 +328,13 @@ submission to slurm complete!
328
  ###############################
329
  slurm submission output
330
 
331
- Submitted batch job 7631530
332
 
333
 
334
 
335
  ###############################
336
 
337
- slurm submission log: 2024-05-19 09:34:33.468022
338
  created following sbatch script:
339
 
340
  ###############################
@@ -343,13 +343,13 @@ created following sbatch script:
343
 
344
  #SBATCH --account=nlp
345
  #SBATCH --cpus-per-task=16
346
- #SBATCH --dependency=afterok:7631593
347
  #SBATCH --gres=gpu:1
348
- #SBATCH --job-name=tthrush-job-2085637
349
  #SBATCH --mem=60G
350
  #SBATCH --nodelist=sphinx2
351
  #SBATCH --open-mode=append
352
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/eval_job_output.txt
353
  #SBATCH --partition=sphinx
354
  #SBATCH --time=14-0
355
 
@@ -360,7 +360,7 @@ created following sbatch script:
360
  cd .
361
 
362
  # launch commands
363
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/perf'
364
 
365
  ###############################
366
 
@@ -370,13 +370,13 @@ submission to slurm complete!
370
  ###############################
371
  slurm submission output
372
 
373
- Submitted batch job 7631594
374
 
375
 
376
 
377
  ###############################
378
 
379
- slurm submission log: 2024-05-19 09:45:20.755632
380
  created following sbatch script:
381
 
382
  ###############################
@@ -385,13 +385,13 @@ created following sbatch script:
385
 
386
  #SBATCH --account=nlp
387
  #SBATCH --cpus-per-task=16
388
- #SBATCH --dependency=afterok:7631663
389
  #SBATCH --gres=gpu:1
390
- #SBATCH --job-name=tthrush-job-1519057
391
  #SBATCH --mem=60G
392
  #SBATCH --nodelist=sphinx1
393
  #SBATCH --open-mode=append
394
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/eval_job_output.txt
395
  #SBATCH --partition=sphinx
396
  #SBATCH --time=14-0
397
 
@@ -402,7 +402,7 @@ created following sbatch script:
402
  cd .
403
 
404
  # launch commands
405
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_1/perf'
406
 
407
  ###############################
408
 
@@ -412,7 +412,7 @@ submission to slurm complete!
412
  ###############################
413
  slurm submission output
414
 
415
- Submitted batch job 7631664
416
 
417
 
418
 
 
1
+ slurm submission log: 2024-05-19 09:14:42.488664
2
  created following sbatch script:
3
 
4
  ###############################
 
7
 
8
  #SBATCH --account=nlp
9
  #SBATCH --cpus-per-task=16
10
+ #SBATCH --dependency=afterok:7631091
11
  #SBATCH --gres=gpu:1
12
+ #SBATCH --job-name=tthrush-job-2392557
13
  #SBATCH --mem=60G
14
  #SBATCH --nodelist=sphinx2
15
  #SBATCH --open-mode=append
16
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/eval_job_output.txt
17
  #SBATCH --partition=sphinx
18
  #SBATCH --time=14-0
19
 
 
24
  cd .
25
 
26
  # launch commands
27
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/perf'
28
 
29
  ###############################
30
 
 
34
  ###############################
35
  slurm submission output
36
 
37
+ Submitted batch job 7631092
38
 
39
 
40
 
41
  ###############################
42
 
43
+ slurm submission log: 2024-05-19 09:16:21.652778
44
  created following sbatch script:
45
 
46
  ###############################
 
49
 
50
  #SBATCH --account=nlp
51
  #SBATCH --cpus-per-task=16
52
+ #SBATCH --dependency=afterok:7631152
53
  #SBATCH --gres=gpu:1
54
+ #SBATCH --job-name=tthrush-job-2688925
55
  #SBATCH --mem=60G
56
  #SBATCH --nodelist=sphinx2
57
  #SBATCH --open-mode=append
58
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/eval_job_output.txt
59
  #SBATCH --partition=sphinx
60
  #SBATCH --time=14-0
61
 
 
66
  cd .
67
 
68
  # launch commands
69
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/perf'
70
 
71
  ###############################
72
 
 
76
  ###############################
77
  slurm submission output
78
 
79
+ Submitted batch job 7631153
80
 
81
 
82
 
83
  ###############################
84
 
85
+ slurm submission log: 2024-05-19 09:25:08.950627
86
  created following sbatch script:
87
 
88
  ###############################
 
91
 
92
  #SBATCH --account=nlp
93
  #SBATCH --cpus-per-task=16
94
+ #SBATCH --dependency=afterok:7631223
95
  #SBATCH --gres=gpu:1
96
+ #SBATCH --job-name=tthrush-job-1036385
97
  #SBATCH --mem=60G
98
  #SBATCH --nodelist=sphinx2
99
  #SBATCH --open-mode=append
100
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/eval_job_output.txt
101
  #SBATCH --partition=sphinx
102
  #SBATCH --time=14-0
103
 
 
108
  cd .
109
 
110
  # launch commands
111
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/perf'
112
 
113
  ###############################
114
 
 
118
  ###############################
119
  slurm submission output
120
 
121
+ Submitted batch job 7631224
122
 
123
 
124
 
125
  ###############################
126
 
127
+ slurm submission log: 2024-05-19 09:27:21.986519
128
  created following sbatch script:
129
 
130
  ###############################
 
133
 
134
  #SBATCH --account=nlp
135
  #SBATCH --cpus-per-task=16
136
+ #SBATCH --dependency=afterok:7631286
137
  #SBATCH --gres=gpu:1
138
+ #SBATCH --job-name=tthrush-job-2902502
139
  #SBATCH --mem=60G
140
  #SBATCH --nodelist=sphinx2
141
  #SBATCH --open-mode=append
142
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/eval_job_output.txt
143
  #SBATCH --partition=sphinx
144
  #SBATCH --time=14-0
145
 
 
150
  cd .
151
 
152
  # launch commands
153
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/perf'
154
 
155
  ###############################
156
 
 
160
  ###############################
161
  slurm submission output
162
 
163
+ Submitted batch job 7631287
164
 
165
 
166
 
167
  ###############################
168
 
169
+ slurm submission log: 2024-05-19 09:28:18.563452
170
  created following sbatch script:
171
 
172
  ###############################
 
175
 
176
  #SBATCH --account=nlp
177
  #SBATCH --cpus-per-task=16
178
+ #SBATCH --dependency=afterok:7631350
179
  #SBATCH --gres=gpu:1
180
+ #SBATCH --job-name=tthrush-job-4933727
181
  #SBATCH --mem=60G
182
  #SBATCH --nodelist=sphinx2
183
  #SBATCH --open-mode=append
184
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/eval_job_output.txt
185
  #SBATCH --partition=sphinx
186
  #SBATCH --time=14-0
187
 
 
192
  cd .
193
 
194
  # launch commands
195
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/perf'
196
 
197
  ###############################
198
 
 
202
  ###############################
203
  slurm submission output
204
 
205
+ Submitted batch job 7631351
206
 
207
 
208
 
209
  ###############################
210
 
211
+ slurm submission log: 2024-05-19 09:29:21.274779
212
  created following sbatch script:
213
 
214
  ###############################
 
217
 
218
  #SBATCH --account=nlp
219
  #SBATCH --cpus-per-task=16
220
+ #SBATCH --dependency=afterok:7631411
221
  #SBATCH --gres=gpu:1
222
+ #SBATCH --job-name=tthrush-job-3698708
223
  #SBATCH --mem=60G
224
  #SBATCH --nodelist=sphinx2
225
  #SBATCH --open-mode=append
226
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/eval_job_output.txt
227
  #SBATCH --partition=sphinx
228
  #SBATCH --time=14-0
229
 
 
234
  cd .
235
 
236
  # launch commands
237
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/perf'
238
 
239
  ###############################
240
 
 
244
  ###############################
245
  slurm submission output
246
 
247
+ Submitted batch job 7631412
248
 
249
 
250
 
251
  ###############################
252
 
253
+ slurm submission log: 2024-05-19 09:30:35.685306
254
  created following sbatch script:
255
 
256
  ###############################
 
259
 
260
  #SBATCH --account=nlp
261
  #SBATCH --cpus-per-task=16
262
+ #SBATCH --dependency=afterok:7631471
263
  #SBATCH --gres=gpu:1
264
+ #SBATCH --job-name=tthrush-job-2560205
265
  #SBATCH --mem=60G
266
  #SBATCH --nodelist=sphinx2
267
  #SBATCH --open-mode=append
268
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/eval_job_output.txt
269
  #SBATCH --partition=sphinx
270
  #SBATCH --time=14-0
271
 
 
276
  cd .
277
 
278
  # launch commands
279
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/perf'
280
 
281
  ###############################
282
 
 
286
  ###############################
287
  slurm submission output
288
 
289
+ Submitted batch job 7631472
290
 
291
 
292
 
293
  ###############################
294
 
295
+ slurm submission log: 2024-05-19 09:31:41.306720
296
  created following sbatch script:
297
 
298
  ###############################
 
301
 
302
  #SBATCH --account=nlp
303
  #SBATCH --cpus-per-task=16
304
+ #SBATCH --dependency=afterok:7631531
305
  #SBATCH --gres=gpu:1
306
+ #SBATCH --job-name=tthrush-job-2924713
307
  #SBATCH --mem=60G
308
  #SBATCH --nodelist=sphinx2
309
  #SBATCH --open-mode=append
310
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/eval_job_output.txt
311
  #SBATCH --partition=sphinx
312
  #SBATCH --time=14-0
313
 
 
318
  cd .
319
 
320
  # launch commands
321
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/perf'
322
 
323
  ###############################
324
 
 
328
  ###############################
329
  slurm submission output
330
 
331
+ Submitted batch job 7631532
332
 
333
 
334
 
335
  ###############################
336
 
337
+ slurm submission log: 2024-05-19 09:34:33.977628
338
  created following sbatch script:
339
 
340
  ###############################
 
343
 
344
  #SBATCH --account=nlp
345
  #SBATCH --cpus-per-task=16
346
+ #SBATCH --dependency=afterok:7631595
347
  #SBATCH --gres=gpu:1
348
+ #SBATCH --job-name=tthrush-job-2674587
349
  #SBATCH --mem=60G
350
  #SBATCH --nodelist=sphinx2
351
  #SBATCH --open-mode=append
352
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/eval_job_output.txt
353
  #SBATCH --partition=sphinx
354
  #SBATCH --time=14-0
355
 
 
360
  cd .
361
 
362
  # launch commands
363
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/perf'
364
 
365
  ###############################
366
 
 
370
  ###############################
371
  slurm submission output
372
 
373
+ Submitted batch job 7631596
374
 
375
 
376
 
377
  ###############################
378
 
379
+ slurm submission log: 2024-05-19 09:45:21.296491
380
  created following sbatch script:
381
 
382
  ###############################
 
385
 
386
  #SBATCH --account=nlp
387
  #SBATCH --cpus-per-task=16
388
+ #SBATCH --dependency=afterok:7631665
389
  #SBATCH --gres=gpu:1
390
+ #SBATCH --job-name=tthrush-job-1375329
391
  #SBATCH --mem=60G
392
  #SBATCH --nodelist=sphinx1
393
  #SBATCH --open-mode=append
394
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/eval_job_output.txt
395
  #SBATCH --partition=sphinx
396
  #SBATCH --time=14-0
397
 
 
402
  cd .
403
 
404
  # launch commands
405
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_2/perf'
406
 
407
  ###############################
408
 
 
412
  ###############################
413
  slurm submission output
414
 
415
+ Submitted batch job 7631666
416
 
417
 
418
 
logs/events.out.tfevents.1716140425.sphinx2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:118e928fa50d53fde7a574aef616017feb6d08205517463fa679efc22c028537
3
+ size 62915
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3afd047f9e5e4ca187b5da65a2eb8e83ffe8cd36e546c2a2d02bb834f72e0369
3
  size 56279344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46b7bc3e26076df51d109429adeb6ec620e07b96cd90221f2b008c439c6f2172
3
  size 56279344
train_job_output.txt CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2bb7b3dce46a3ed23526d06f496a5d2feb3176cdf51b3c78e887057bddf0e2e
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e103f778fa9e1b73509711af9ac44164adfeb3e4d0e1e2760f8e4eed845ce2c3
3
  size 5176