Tristan committed on
Commit
a3531be
1 Parent(s): 00471ba

Training in progress, epoch 0

Browse files
eval_job_output.txt CHANGED
@@ -1,4 +1,4 @@
1
- slurm submission log: 2024-05-19 09:14:44.387762
2
  created following sbatch script:
3
 
4
  ###############################
@@ -7,13 +7,13 @@ created following sbatch script:
7
 
8
  #SBATCH --account=nlp
9
  #SBATCH --cpus-per-task=16
10
- #SBATCH --dependency=afterok:7631097
11
  #SBATCH --gres=gpu:1
12
- #SBATCH --job-name=tthrush-job-3081790
13
  #SBATCH --mem=60G
14
  #SBATCH --nodelist=sphinx2
15
  #SBATCH --open-mode=append
16
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/eval_job_output.txt
17
  #SBATCH --partition=sphinx
18
  #SBATCH --time=14-0
19
 
@@ -24,7 +24,7 @@ created following sbatch script:
24
  cd .
25
 
26
  # launch commands
27
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/perf'
28
 
29
  ###############################
30
 
@@ -34,13 +34,13 @@ submission to slurm complete!
34
  ###############################
35
  slurm submission output
36
 
37
- Submitted batch job 7631098
38
 
39
 
40
 
41
  ###############################
42
 
43
- slurm submission log: 2024-05-19 09:16:23.491506
44
  created following sbatch script:
45
 
46
  ###############################
@@ -49,13 +49,13 @@ created following sbatch script:
49
 
50
  #SBATCH --account=nlp
51
  #SBATCH --cpus-per-task=16
52
- #SBATCH --dependency=afterok:7631158
53
  #SBATCH --gres=gpu:1
54
- #SBATCH --job-name=tthrush-job-1709178
55
  #SBATCH --mem=60G
56
  #SBATCH --nodelist=sphinx2
57
  #SBATCH --open-mode=append
58
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/eval_job_output.txt
59
  #SBATCH --partition=sphinx
60
  #SBATCH --time=14-0
61
 
@@ -66,7 +66,7 @@ created following sbatch script:
66
  cd .
67
 
68
  # launch commands
69
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/perf'
70
 
71
  ###############################
72
 
@@ -76,13 +76,13 @@ submission to slurm complete!
76
  ###############################
77
  slurm submission output
78
 
79
- Submitted batch job 7631159
80
 
81
 
82
 
83
  ###############################
84
 
85
- slurm submission log: 2024-05-19 09:25:10.468510
86
  created following sbatch script:
87
 
88
  ###############################
@@ -91,13 +91,13 @@ created following sbatch script:
91
 
92
  #SBATCH --account=nlp
93
  #SBATCH --cpus-per-task=16
94
- #SBATCH --dependency=afterok:7631229
95
  #SBATCH --gres=gpu:1
96
- #SBATCH --job-name=tthrush-job-2260508
97
  #SBATCH --mem=60G
98
  #SBATCH --nodelist=sphinx2
99
  #SBATCH --open-mode=append
100
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/eval_job_output.txt
101
  #SBATCH --partition=sphinx
102
  #SBATCH --time=14-0
103
 
@@ -108,7 +108,7 @@ created following sbatch script:
108
  cd .
109
 
110
  # launch commands
111
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/perf'
112
 
113
  ###############################
114
 
@@ -118,13 +118,13 @@ submission to slurm complete!
118
  ###############################
119
  slurm submission output
120
 
121
- Submitted batch job 7631230
122
 
123
 
124
 
125
  ###############################
126
 
127
- slurm submission log: 2024-05-19 09:27:23.684328
128
  created following sbatch script:
129
 
130
  ###############################
@@ -133,13 +133,13 @@ created following sbatch script:
133
 
134
  #SBATCH --account=nlp
135
  #SBATCH --cpus-per-task=16
136
- #SBATCH --dependency=afterok:7631292
137
  #SBATCH --gres=gpu:1
138
- #SBATCH --job-name=tthrush-job-304472
139
  #SBATCH --mem=60G
140
  #SBATCH --nodelist=sphinx2
141
  #SBATCH --open-mode=append
142
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/eval_job_output.txt
143
  #SBATCH --partition=sphinx
144
  #SBATCH --time=14-0
145
 
@@ -150,7 +150,7 @@ created following sbatch script:
150
  cd .
151
 
152
  # launch commands
153
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/perf'
154
 
155
  ###############################
156
 
@@ -160,13 +160,13 @@ submission to slurm complete!
160
  ###############################
161
  slurm submission output
162
 
163
- Submitted batch job 7631293
164
 
165
 
166
 
167
  ###############################
168
 
169
- slurm submission log: 2024-05-19 09:28:20.203824
170
  created following sbatch script:
171
 
172
  ###############################
@@ -175,13 +175,13 @@ created following sbatch script:
175
 
176
  #SBATCH --account=nlp
177
  #SBATCH --cpus-per-task=16
178
- #SBATCH --dependency=afterok:7631356
179
  #SBATCH --gres=gpu:1
180
- #SBATCH --job-name=tthrush-job-107557
181
  #SBATCH --mem=60G
182
  #SBATCH --nodelist=sphinx2
183
  #SBATCH --open-mode=append
184
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/eval_job_output.txt
185
  #SBATCH --partition=sphinx
186
  #SBATCH --time=14-0
187
 
@@ -192,7 +192,7 @@ created following sbatch script:
192
  cd .
193
 
194
  # launch commands
195
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/perf'
196
 
197
  ###############################
198
 
@@ -202,13 +202,13 @@ submission to slurm complete!
202
  ###############################
203
  slurm submission output
204
 
205
- Submitted batch job 7631357
206
 
207
 
208
 
209
  ###############################
210
 
211
- slurm submission log: 2024-05-19 09:29:23.083307
212
  created following sbatch script:
213
 
214
  ###############################
@@ -217,13 +217,13 @@ created following sbatch script:
217
 
218
  #SBATCH --account=nlp
219
  #SBATCH --cpus-per-task=16
220
- #SBATCH --dependency=afterok:7631417
221
  #SBATCH --gres=gpu:1
222
- #SBATCH --job-name=tthrush-job-2909862
223
  #SBATCH --mem=60G
224
  #SBATCH --nodelist=sphinx2
225
  #SBATCH --open-mode=append
226
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/eval_job_output.txt
227
  #SBATCH --partition=sphinx
228
  #SBATCH --time=14-0
229
 
@@ -234,7 +234,7 @@ created following sbatch script:
234
  cd .
235
 
236
  # launch commands
237
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/perf'
238
 
239
  ###############################
240
 
@@ -244,13 +244,13 @@ submission to slurm complete!
244
  ###############################
245
  slurm submission output
246
 
247
- Submitted batch job 7631418
248
 
249
 
250
 
251
  ###############################
252
 
253
- slurm submission log: 2024-05-19 09:30:37.406226
254
  created following sbatch script:
255
 
256
  ###############################
@@ -259,13 +259,13 @@ created following sbatch script:
259
 
260
  #SBATCH --account=nlp
261
  #SBATCH --cpus-per-task=16
262
- #SBATCH --dependency=afterok:7631477
263
  #SBATCH --gres=gpu:1
264
- #SBATCH --job-name=tthrush-job-4866433
265
  #SBATCH --mem=60G
266
  #SBATCH --nodelist=sphinx2
267
  #SBATCH --open-mode=append
268
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/eval_job_output.txt
269
  #SBATCH --partition=sphinx
270
  #SBATCH --time=14-0
271
 
@@ -276,7 +276,7 @@ created following sbatch script:
276
  cd .
277
 
278
  # launch commands
279
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/perf'
280
 
281
  ###############################
282
 
@@ -286,13 +286,13 @@ submission to slurm complete!
286
  ###############################
287
  slurm submission output
288
 
289
- Submitted batch job 7631478
290
 
291
 
292
 
293
  ###############################
294
 
295
- slurm submission log: 2024-05-19 09:31:43.783202
296
  created following sbatch script:
297
 
298
  ###############################
@@ -301,13 +301,13 @@ created following sbatch script:
301
 
302
  #SBATCH --account=nlp
303
  #SBATCH --cpus-per-task=16
304
- #SBATCH --dependency=afterok:7631537
305
  #SBATCH --gres=gpu:1
306
- #SBATCH --job-name=tthrush-job-114836
307
  #SBATCH --mem=60G
308
  #SBATCH --nodelist=sphinx2
309
  #SBATCH --open-mode=append
310
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/eval_job_output.txt
311
  #SBATCH --partition=sphinx
312
  #SBATCH --time=14-0
313
 
@@ -318,7 +318,7 @@ created following sbatch script:
318
  cd .
319
 
320
  # launch commands
321
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/perf'
322
 
323
  ###############################
324
 
@@ -328,13 +328,13 @@ submission to slurm complete!
328
  ###############################
329
  slurm submission output
330
 
331
- Submitted batch job 7631538
332
 
333
 
334
 
335
  ###############################
336
 
337
- slurm submission log: 2024-05-19 09:34:35.667426
338
  created following sbatch script:
339
 
340
  ###############################
@@ -343,13 +343,13 @@ created following sbatch script:
343
 
344
  #SBATCH --account=nlp
345
  #SBATCH --cpus-per-task=16
346
- #SBATCH --dependency=afterok:7631601
347
  #SBATCH --gres=gpu:1
348
- #SBATCH --job-name=tthrush-job-1198993
349
  #SBATCH --mem=60G
350
  #SBATCH --nodelist=sphinx2
351
  #SBATCH --open-mode=append
352
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/eval_job_output.txt
353
  #SBATCH --partition=sphinx
354
  #SBATCH --time=14-0
355
 
@@ -360,7 +360,7 @@ created following sbatch script:
360
  cd .
361
 
362
  # launch commands
363
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/perf'
364
 
365
  ###############################
366
 
@@ -370,13 +370,13 @@ submission to slurm complete!
370
  ###############################
371
  slurm submission output
372
 
373
- Submitted batch job 7631602
374
 
375
 
376
 
377
  ###############################
378
 
379
- slurm submission log: 2024-05-19 09:45:22.891907
380
  created following sbatch script:
381
 
382
  ###############################
@@ -385,13 +385,13 @@ created following sbatch script:
385
 
386
  #SBATCH --account=nlp
387
  #SBATCH --cpus-per-task=16
388
- #SBATCH --dependency=afterok:7631671
389
  #SBATCH --gres=gpu:1
390
- #SBATCH --job-name=tthrush-job-1044352
391
  #SBATCH --mem=60G
392
  #SBATCH --nodelist=sphinx1
393
  #SBATCH --open-mode=append
394
- #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/eval_job_output.txt
395
  #SBATCH --partition=sphinx
396
  #SBATCH --time=14-0
397
 
@@ -402,7 +402,7 @@ created following sbatch script:
402
  cd .
403
 
404
  # launch commands
405
- srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_5/perf'
406
 
407
  ###############################
408
 
@@ -412,7 +412,7 @@ submission to slurm complete!
412
  ###############################
413
  slurm submission output
414
 
415
- Submitted batch job 7631672
416
 
417
 
418
 
 
1
+ slurm submission log: 2024-05-19 09:14:43.766078
2
  created following sbatch script:
3
 
4
  ###############################
 
7
 
8
  #SBATCH --account=nlp
9
  #SBATCH --cpus-per-task=16
10
+ #SBATCH --dependency=afterok:7631095
11
  #SBATCH --gres=gpu:1
12
+ #SBATCH --job-name=tthrush-job-778997
13
  #SBATCH --mem=60G
14
  #SBATCH --nodelist=sphinx2
15
  #SBATCH --open-mode=append
16
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/eval_job_output.txt
17
  #SBATCH --partition=sphinx
18
  #SBATCH --time=14-0
19
 
 
24
  cd .
25
 
26
  # launch commands
27
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/perf'
28
 
29
  ###############################
30
 
 
34
  ###############################
35
  slurm submission output
36
 
37
+ Submitted batch job 7631096
38
 
39
 
40
 
41
  ###############################
42
 
43
+ slurm submission log: 2024-05-19 09:16:22.850586
44
  created following sbatch script:
45
 
46
  ###############################
 
49
 
50
  #SBATCH --account=nlp
51
  #SBATCH --cpus-per-task=16
52
+ #SBATCH --dependency=afterok:7631156
53
  #SBATCH --gres=gpu:1
54
+ #SBATCH --job-name=tthrush-job-725929
55
  #SBATCH --mem=60G
56
  #SBATCH --nodelist=sphinx2
57
  #SBATCH --open-mode=append
58
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/eval_job_output.txt
59
  #SBATCH --partition=sphinx
60
  #SBATCH --time=14-0
61
 
 
66
  cd .
67
 
68
  # launch commands
69
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/perf'
70
 
71
  ###############################
72
 
 
76
  ###############################
77
  slurm submission output
78
 
79
+ Submitted batch job 7631157
80
 
81
 
82
 
83
  ###############################
84
 
85
+ slurm submission log: 2024-05-19 09:25:09.971960
86
  created following sbatch script:
87
 
88
  ###############################
 
91
 
92
  #SBATCH --account=nlp
93
  #SBATCH --cpus-per-task=16
94
+ #SBATCH --dependency=afterok:7631227
95
  #SBATCH --gres=gpu:1
96
+ #SBATCH --job-name=tthrush-job-2124841
97
  #SBATCH --mem=60G
98
  #SBATCH --nodelist=sphinx2
99
  #SBATCH --open-mode=append
100
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/eval_job_output.txt
101
  #SBATCH --partition=sphinx
102
  #SBATCH --time=14-0
103
 
 
108
  cd .
109
 
110
  # launch commands
111
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/perf'
112
 
113
  ###############################
114
 
 
118
  ###############################
119
  slurm submission output
120
 
121
+ Submitted batch job 7631228
122
 
123
 
124
 
125
  ###############################
126
 
127
+ slurm submission log: 2024-05-19 09:27:23.099613
128
  created following sbatch script:
129
 
130
  ###############################
 
133
 
134
  #SBATCH --account=nlp
135
  #SBATCH --cpus-per-task=16
136
+ #SBATCH --dependency=afterok:7631290
137
  #SBATCH --gres=gpu:1
138
+ #SBATCH --job-name=tthrush-job-3977677
139
  #SBATCH --mem=60G
140
  #SBATCH --nodelist=sphinx2
141
  #SBATCH --open-mode=append
142
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/eval_job_output.txt
143
  #SBATCH --partition=sphinx
144
  #SBATCH --time=14-0
145
 
 
150
  cd .
151
 
152
  # launch commands
153
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/perf'
154
 
155
  ###############################
156
 
 
160
  ###############################
161
  slurm submission output
162
 
163
+ Submitted batch job 7631291
164
 
165
 
166
 
167
  ###############################
168
 
169
+ slurm submission log: 2024-05-19 09:28:19.702866
170
  created following sbatch script:
171
 
172
  ###############################
 
175
 
176
  #SBATCH --account=nlp
177
  #SBATCH --cpus-per-task=16
178
+ #SBATCH --dependency=afterok:7631354
179
  #SBATCH --gres=gpu:1
180
+ #SBATCH --job-name=tthrush-job-2200551
181
  #SBATCH --mem=60G
182
  #SBATCH --nodelist=sphinx2
183
  #SBATCH --open-mode=append
184
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/eval_job_output.txt
185
  #SBATCH --partition=sphinx
186
  #SBATCH --time=14-0
187
 
 
192
  cd .
193
 
194
  # launch commands
195
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/perf'
196
 
197
  ###############################
198
 
 
202
  ###############################
203
  slurm submission output
204
 
205
+ Submitted batch job 7631355
206
 
207
 
208
 
209
  ###############################
210
 
211
+ slurm submission log: 2024-05-19 09:29:22.474916
212
  created following sbatch script:
213
 
214
  ###############################
 
217
 
218
  #SBATCH --account=nlp
219
  #SBATCH --cpus-per-task=16
220
+ #SBATCH --dependency=afterok:7631415
221
  #SBATCH --gres=gpu:1
222
+ #SBATCH --job-name=tthrush-job-927768
223
  #SBATCH --mem=60G
224
  #SBATCH --nodelist=sphinx2
225
  #SBATCH --open-mode=append
226
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/eval_job_output.txt
227
  #SBATCH --partition=sphinx
228
  #SBATCH --time=14-0
229
 
 
234
  cd .
235
 
236
  # launch commands
237
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/perf'
238
 
239
  ###############################
240
 
 
244
  ###############################
245
  slurm submission output
246
 
247
+ Submitted batch job 7631416
248
 
249
 
250
 
251
  ###############################
252
 
253
+ slurm submission log: 2024-05-19 09:30:36.859049
254
  created following sbatch script:
255
 
256
  ###############################
 
259
 
260
  #SBATCH --account=nlp
261
  #SBATCH --cpus-per-task=16
262
+ #SBATCH --dependency=afterok:7631475
263
  #SBATCH --gres=gpu:1
264
+ #SBATCH --job-name=tthrush-job-3488091
265
  #SBATCH --mem=60G
266
  #SBATCH --nodelist=sphinx2
267
  #SBATCH --open-mode=append
268
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/eval_job_output.txt
269
  #SBATCH --partition=sphinx
270
  #SBATCH --time=14-0
271
 
 
276
  cd .
277
 
278
  # launch commands
279
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/perf'
280
 
281
  ###############################
282
 
 
286
  ###############################
287
  slurm submission output
288
 
289
+ Submitted batch job 7631476
290
 
291
 
292
 
293
  ###############################
294
 
295
+ slurm submission log: 2024-05-19 09:31:43.176565
296
  created following sbatch script:
297
 
298
  ###############################
 
301
 
302
  #SBATCH --account=nlp
303
  #SBATCH --cpus-per-task=16
304
+ #SBATCH --dependency=afterok:7631535
305
  #SBATCH --gres=gpu:1
306
+ #SBATCH --job-name=tthrush-job-3499676
307
  #SBATCH --mem=60G
308
  #SBATCH --nodelist=sphinx2
309
  #SBATCH --open-mode=append
310
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/eval_job_output.txt
311
  #SBATCH --partition=sphinx
312
  #SBATCH --time=14-0
313
 
 
318
  cd .
319
 
320
  # launch commands
321
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/perf'
322
 
323
  ###############################
324
 
 
328
  ###############################
329
  slurm submission output
330
 
331
+ Submitted batch job 7631536
332
 
333
 
334
 
335
  ###############################
336
 
337
+ slurm submission log: 2024-05-19 09:34:35.056719
338
  created following sbatch script:
339
 
340
  ###############################
 
343
 
344
  #SBATCH --account=nlp
345
  #SBATCH --cpus-per-task=16
346
+ #SBATCH --dependency=afterok:7631599
347
  #SBATCH --gres=gpu:1
348
+ #SBATCH --job-name=tthrush-job-1235758
349
  #SBATCH --mem=60G
350
  #SBATCH --nodelist=sphinx2
351
  #SBATCH --open-mode=append
352
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/eval_job_output.txt
353
  #SBATCH --partition=sphinx
354
  #SBATCH --time=14-0
355
 
 
360
  cd .
361
 
362
  # launch commands
363
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/perf'
364
 
365
  ###############################
366
 
 
370
  ###############################
371
  slurm submission output
372
 
373
+ Submitted batch job 7631600
374
 
375
 
376
 
377
  ###############################
378
 
379
+ slurm submission log: 2024-05-19 09:45:22.363194
380
  created following sbatch script:
381
 
382
  ###############################
 
385
 
386
  #SBATCH --account=nlp
387
  #SBATCH --cpus-per-task=16
388
+ #SBATCH --dependency=afterok:7631669
389
  #SBATCH --gres=gpu:1
390
+ #SBATCH --job-name=tthrush-job-4329745
391
  #SBATCH --mem=60G
392
  #SBATCH --nodelist=sphinx1
393
  #SBATCH --open-mode=append
394
+ #SBATCH --output=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/eval_job_output.txt
395
  #SBATCH --partition=sphinx
396
  #SBATCH --time=14-0
397
 
 
402
  cd .
403
 
404
  # launch commands
405
+ srun --unbuffered run_as_child_processes 'lm_eval --model hf --model_args pretrained=/juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4,revision=main,dtype=float16,trust_remote_code=True --tasks xnli_en,xnli_fr,sciq,piqa,lambada,arc_easy --device cuda --output_path /juice5/scr5/tthrush/pretraining-coreset-selection/llm_pretraining/14m_llm_seeds_more_data/pythia-14m_piqa_4/perf'
406
 
407
  ###############################
408
 
 
412
  ###############################
413
  slurm submission output
414
 
415
+ Submitted batch job 7631670
416
 
417
 
418
 
logs/events.out.tfevents.1716141245.sphinx2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba36bd1744bcde3ca24befdfd3cc3514cf7040e534d52d7c906c2acd645f2e0b
3
+ size 62915
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a897857375508348f7af40c14b85238a3c613b88f4ddcaa1809bcafc02a580a
3
  size 56279344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d8829ba10143cdefe4f0a0eba804d7a18373fcffa8440c78086dbb1f4e4cdc5
3
  size 56279344
train_job_output.txt CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:050588f4c277de5ea5d273554c360f76ecbf7d42eee9691b280c658c880a1ae5
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5d2281eb87965f61928c88679fa97c14e286fa3aa056ffc92ba156a8fb9d768
3
  size 5176