nipunsadvilkar committed on
Commit
74af663
1 Parent(s): a407cc8

Saving weights and logs of step 500

Browse files
.gitattributes CHANGED
@@ -14,3 +14,4 @@
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
 
 
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
17
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76d55c57630984430801c3b6d5cc75703bd2a61ef6bb8f9d20f7c6150f2dfbd3
3
  size 498796983
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1f30bd95331d281308f6cb94e74bec0d82ebc06684501d536c8d38952e09abb
3
  size 498796983
run.log CHANGED
@@ -1,4 +1,4 @@
1
- [16:38:48] - INFO - __main__ - Training/evaluation parameters TrainingArguments(
2
  _n_gpu=-1,
3
  adafactor=False,
4
  adam_beta1=0.9,
@@ -34,7 +34,7 @@ local_rank=-1,
34
  log_level=-1,
35
  log_level_replica=-1,
36
  log_on_each_node=True,
37
- logging_dir=./runs/Jul08_16-38-48_t1v-n-112df4a9-w-0,
38
  logging_first_step=False,
39
  logging_steps=500,
40
  logging_strategy=IntervalStrategy.STEPS,
@@ -56,9 +56,9 @@ push_to_hub_model_id=flax-community/roberta-base-mr,
56
  push_to_hub_organization=None,
57
  push_to_hub_token=vdIAyRvCACJNslYtyLHufmNDnUIyknPzUgVDMFiXqJoulvMqjoubonLJzXOJQJczWfRMJumVaMFjGSFVnQAMdswvZkzNIthKrxBeARBXfqnIwjABkKpCbjGEgnkjpjKi,
58
  remove_unused_columns=True,
59
- report_to=[],
60
  resume_from_checkpoint=None,
61
- run_name=./,
62
  save_on_each_node=False,
63
  save_steps=500,
64
  save_strategy=IntervalStrategy.STEPS,
@@ -73,326 +73,183 @@ warmup_ratio=0.0,
73
  warmup_steps=1000,
74
  weight_decay=0.0,
75
  )
76
- [16:38:48] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): s3.amazonaws.com:443
77
- [16:38:48] - DEBUG - urllib3.connectionpool - https://s3.amazonaws.com:443 "HEAD /datasets.huggingface.co/datasets/datasets/oscar/oscar.py HTTP/1.1" 404 0
78
- [16:38:48] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
79
- [16:38:48] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/oscar.py HTTP/1.1" 200 0
80
- [16:38:48] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
81
- [16:38:49] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/dataset_infos.json HTTP/1.1" 200 0
82
- [16:38:49] - WARNING - datasets.builder - Reusing dataset oscar (/home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2)
83
- [16:38:49] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): s3.amazonaws.com:443
84
- [16:38:49] - DEBUG - urllib3.connectionpool - https://s3.amazonaws.com:443 "HEAD /datasets.huggingface.co/datasets/datasets/oscar/oscar.py HTTP/1.1" 404 0
85
- [16:38:49] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
86
- [16:38:49] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/oscar.py HTTP/1.1" 200 0
87
- [16:38:49] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
88
- [16:38:49] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/dataset_infos.json HTTP/1.1" 200 0
89
- [16:38:49] - WARNING - datasets.builder - Reusing dataset oscar (/home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2)
90
- [16:38:49] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): s3.amazonaws.com:443
91
- [16:38:49] - DEBUG - urllib3.connectionpool - https://s3.amazonaws.com:443 "HEAD /datasets.huggingface.co/datasets/datasets/oscar/oscar.py HTTP/1.1" 404 0
92
- [16:38:49] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
93
- [16:38:49] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/oscar.py HTTP/1.1" 200 0
94
- [16:38:49] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
95
- [16:38:49] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/dataset_infos.json HTTP/1.1" 200 0
96
- [16:38:49] - WARNING - datasets.builder - Reusing dataset oscar (/home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2)
97
- [16:38:49] - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2/cache-0f52086e7b10d7e8.arrow
98
- [16:38:49] - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2/cache-a39e5f5a5c6c69fc.arrow
99
- [16:38:49] - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2/cache-e4d3282a2dd50fa0.arrow
100
- [16:38:49] - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2/cache-b9a3aa9913be3b34.arrow
101
- [16:38:49] - WARNING - __main__ - Unable to display metrics through TensorBoard because the package is not installed: Please run pip install tensorboard to enable.
102
- [16:38:49] - INFO - absl - Starting the local TPU driver.
103
- [16:38:49] - INFO - absl - Unable to initialize backend 'tpu_driver': Not found: Unable to find driver in registry given worker: local://
104
- [16:38:49] - INFO - absl - Unable to initialize backend 'gpu': Not found: Could not find registered platform with name: "cuda". Available platform names are: TPU Host Interpreter
105
  /home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/jax/lib/xla_bridge.py:382: UserWarning: jax.host_count has been renamed to jax.process_count. This alias will eventually be removed; please update your code.
106
  warnings.warn(
107
  /home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/jax/lib/xla_bridge.py:369: UserWarning: jax.host_id has been renamed to jax.process_index. This alias will eventually be removed; please update your code.
108
  warnings.warn(
109
 
110
 
111
-
112
-
113
-
114
-
115
-
116
-
117
-
118
-
119
-
120
-
121
-
122
-
123
-
124
-
125
-
126
-
127
-
128
-
129
-
130
-
131
-
132
-
133
-
134
-
135
-
136
-
137
-
138
-
139
-
140
-
141
-
142
-
143
-
144
-
145
-
146
-
147
-
148
 
149
-
150
-
151
-
152
-
153
-
154
-
155
-
156
-
157
-
158
-
159
-
160
-
161
-
162
-
163
-
164
-
165
-
166
-
167
-
168
-
169
-
170
-
171
-
172
-
173
-
174
-
175
-
176
-
177
-
178
-
179
-
180
-
181
-
182
-
183
-
184
-
185
 
186
-
187
-
188
-
189
-
190
-
191
-
192
-
193
-
194
-
195
-
196
-
197
-
198
-
199
-
200
-
201
-
202
-
203
-
204
-
205
-
206
-
207
-
208
-
209
-
210
-
211
-
212
-
213
-
214
-
215
-
216
-
217
-
218
-
219
-
220
-
221
-
 
222
 
223
-
224
-
225
-
226
-
227
-
228
-
229
-
230
-
231
-
232
-
233
-
234
-
235
-
236
-
237
-
238
-
239
-
240
-
241
 
242
-
243
 
244
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
245
 
 
246
 
 
247
 
248
 
249
 
250
 
251
-
252
 
253
-
254
- [16:40:34] - INFO - huggingface_hub.repository - git version 2.25.1
255
  git-lfs/2.9.2 (GitHub; linux amd64; go 1.13.5)
256
- [16:40:34] - DEBUG - huggingface_hub.repository - [Repository] is a valid git repo
257
 
258
-
259
-
260
-
261
-
262
-
263
-
264
-
265
-
266
-
267
-
268
-
269
-
270
-
271
-
272
-
273
-
274
-
275
-
276
-
277
-
278
-
279
-
280
-
281
-
282
-
283
-
284
-
285
-
286
-
287
-
288
-
289
-
290
-
291
-
292
-
293
-
294
-
295
-
296
-
297
-
298
-
299
-
300
-
301
-
302
-
303
-
304
-
305
-
306
-
307
-
308
-
309
-
310
-
311
-
312
-
313
-
314
-
315
-
316
-
317
-
318
-
319
-
320
-
321
-
322
-
323
-
324
-
325
-
326
-
327
-
328
-
329
-
330
-
331
-
332
-
333
-
334
-
335
-
336
-
337
-
338
-
339
-
340
-
341
-
342
-
343
-
344
-
345
-
346
-
347
-
348
-
349
-
350
-
351
-
352
-
353
-
354
-
355
-
356
-
357
-
358
-
359
-
360
-
361
-
362
-
363
-
364
-
365
-
366
-
367
-
368
-
369
-
370
-
371
-
372
-
373
-
374
-
375
-
376
-
377
-
378
-
379
-
380
-
381
-
382
-
383
-
384
-
385
-
386
-
387
-
388
-
389
-
390
-
391
-
392
-
393
 
394
-
395
 
396
-
397
-
398
-
399
-
400
-
401
-
402
- [16:41:04] - INFO - huggingface_hub.repository - git version 2.25.1
403
- git-lfs/2.9.2 (GitHub; linux amd64; go 1.13.5)
404
- [16:41:04] - DEBUG - huggingface_hub.repository - [Repository] is a valid git repo
 
1
+ [10:39:50] - INFO - __main__ - Training/evaluation parameters TrainingArguments(
2
  _n_gpu=-1,
3
  adafactor=False,
4
  adam_beta1=0.9,
 
34
  log_level=-1,
35
  log_level_replica=-1,
36
  log_on_each_node=True,
37
+ logging_dir=./runs/Jul09_10-39-50_t1v-n-112df4a9-w-0,
38
  logging_first_step=False,
39
  logging_steps=500,
40
  logging_strategy=IntervalStrategy.STEPS,
 
56
  push_to_hub_organization=None,
57
  push_to_hub_token=vdIAyRvCACJNslYtyLHufmNDnUIyknPzUgVDMFiXqJoulvMqjoubonLJzXOJQJczWfRMJumVaMFjGSFVnQAMdswvZkzNIthKrxBeARBXfqnIwjABkKpCbjGEgnkjpjKi,
58
  remove_unused_columns=True,
59
+ report_to=['wandb'],
60
  resume_from_checkpoint=None,
61
+ run_name=hf-flax-robert-base-mr,
62
  save_on_each_node=False,
63
  save_steps=500,
64
  save_strategy=IntervalStrategy.STEPS,
 
73
  warmup_steps=1000,
74
  weight_decay=0.0,
75
  )
76
+ [10:39:50] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): s3.amazonaws.com:443
77
+ [10:39:50] - DEBUG - urllib3.connectionpool - https://s3.amazonaws.com:443 "HEAD /datasets.huggingface.co/datasets/datasets/oscar/oscar.py HTTP/1.1" 404 0
78
+ [10:39:50] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
79
+ [10:39:50] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/oscar.py HTTP/1.1" 200 0
80
+ [10:39:50] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
81
+ [10:39:50] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/dataset_infos.json HTTP/1.1" 200 0
82
+ [10:39:50] - WARNING - datasets.builder - Reusing dataset oscar (/home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2)
83
+ [10:39:50] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): s3.amazonaws.com:443
84
+ [10:39:51] - DEBUG - urllib3.connectionpool - https://s3.amazonaws.com:443 "HEAD /datasets.huggingface.co/datasets/datasets/oscar/oscar.py HTTP/1.1" 404 0
85
+ [10:39:51] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
86
+ [10:39:51] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/oscar.py HTTP/1.1" 200 0
87
+ [10:39:51] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
88
+ [10:39:51] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/dataset_infos.json HTTP/1.1" 200 0
89
+ [10:39:51] - WARNING - datasets.builder - Reusing dataset oscar (/home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2)
90
+ [10:39:51] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): s3.amazonaws.com:443
91
+ [10:39:51] - DEBUG - urllib3.connectionpool - https://s3.amazonaws.com:443 "HEAD /datasets.huggingface.co/datasets/datasets/oscar/oscar.py HTTP/1.1" 404 0
92
+ [10:39:51] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
93
+ [10:39:51] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/oscar.py HTTP/1.1" 200 0
94
+ [10:39:51] - DEBUG - urllib3.connectionpool - Starting new HTTPS connection (1): raw.githubusercontent.com:443
95
+ [10:39:51] - DEBUG - urllib3.connectionpool - https://raw.githubusercontent.com:443 "HEAD /huggingface/datasets/master/datasets/oscar/dataset_infos.json HTTP/1.1" 200 0
96
+ [10:39:51] - WARNING - datasets.builder - Reusing dataset oscar (/home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2)
97
+ [10:39:51] - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2/cache-0f52086e7b10d7e8.arrow
98
+ [10:39:51] - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2/cache-a39e5f5a5c6c69fc.arrow
99
+ [10:39:51] - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2/cache-e4d3282a2dd50fa0.arrow
100
+ [10:39:51] - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/nipunsadvilkar/.cache/huggingface/datasets/oscar/unshuffled_deduplicated_als/1.0.0/84838bd49d2295f62008383b05620571535451d84545037bb94d6f3501651df2/cache-b9a3aa9913be3b34.arrow
101
+ [10:39:51] - INFO - absl - Starting the local TPU driver.
102
+ [10:39:51] - INFO - absl - Unable to initialize backend 'tpu_driver': Not found: Unable to find driver in registry given worker: local://
103
+ [10:39:51] - INFO - absl - Unable to initialize backend 'gpu': Not found: Could not find registered platform with name: "cuda". Available platform names are: Interpreter Host TPU
104
+ [10:39:55] - WARNING - __main__ - Unable to display metrics through TensorBoard because some package are not installed: No module named 'tensorflow'
105
  /home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/jax/lib/xla_bridge.py:382: UserWarning: jax.host_count has been renamed to jax.process_count. This alias will eventually be removed; please update your code.
106
  warnings.warn(
107
  /home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/jax/lib/xla_bridge.py:369: UserWarning: jax.host_id has been renamed to jax.process_index. This alias will eventually be removed; please update your code.
108
  warnings.warn(
109
 
110
 
111
+
112
+
113
+
114
+
115
+
116
+
117
+
118
+
119
+
120
+
121
+
122
+
123
+
124
+
125
+
126
+
127
+
128
+
129
+
130
+
131
+
132
+
133
+
134
+
135
+
136
+
137
+
138
+
139
+
140
+
141
+
142
+
143
+
144
+
145
+
146
+
147
+
148
 
149
+
150
+
151
+
152
+
153
+
154
+
155
+
156
+
157
+
158
+
159
+
160
+
161
+
162
+
163
+
164
+
165
+
166
+
167
+
168
+
169
+
170
+
171
+
172
+
173
+
174
+
175
+
176
+
177
+
178
+
179
+
180
+
181
+
182
+
183
+
184
+
185
 
186
+
187
+
188
+
189
+
190
+
191
+
192
+
193
+
194
+
195
+
196
+
197
+
198
+
199
+
200
+
201
+
202
+
203
+
204
+
205
+
206
+
207
+
208
+
209
+
210
+
211
+
212
+
213
+
214
+
215
+
216
+
217
+
218
+
219
+
220
+
221
+
222
+
223
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
224
 
 
225
 
226
+
227
+
228
+
229
+
230
+
231
+
232
+
233
+
234
+
235
+
236
+
237
+
238
+
239
+
240
+
241
+
242
+
243
+
244
 
245
+
246
 
247
+
248
 
249
 
250
 
251
 
252
+
253
 
254
+
255
+ [10:41:35] - INFO - huggingface_hub.repository - git version 2.25.1
256
  git-lfs/2.9.2 (GitHub; linux amd64; go 1.13.5)
257
+ [10:41:35] - DEBUG - huggingface_hub.repository - [Repository] is a valid git repo
258
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
259
 
 
260
 
261
+
 
 
 
 
 
 
 
 
run.sh CHANGED
@@ -13,6 +13,8 @@ python run_mlm_flax.py \
13
  --warmup_steps="1000" \
14
  --overwrite_output_dir \
15
  --num_train_epochs="8" \
 
 
16
  --push_to_hub_model_id="flax-community/roberta-base-mr" \
17
  --push_to_hub_token=$HUB_TOKEN \
18
  --push_to_hub 2>&1 | tee run.log
 
13
  --warmup_steps="1000" \
14
  --overwrite_output_dir \
15
  --num_train_epochs="8" \
16
+ --report_to wandb \
17
+ --run_name hf-flax-robert-base-mr \
18
  --push_to_hub_model_id="flax-community/roberta-base-mr" \
19
  --push_to_hub_token=$HUB_TOKEN \
20
  --push_to_hub 2>&1 | tee run.log
run_mlm_flax.py CHANGED
@@ -457,7 +457,6 @@ if __name__ == "__main__":
457
  if has_tensorboard and jax.process_index() == 0:
458
  try:
459
  from flax.metrics.tensorboard import SummaryWriter
460
-
461
  summary_writer = SummaryWriter(log_dir=Path(training_args.output_dir))
462
  except ImportError as ie:
463
  has_tensorboard = False
 
457
  if has_tensorboard and jax.process_index() == 0:
458
  try:
459
  from flax.metrics.tensorboard import SummaryWriter
 
460
  summary_writer = SummaryWriter(log_dir=Path(training_args.output_dir))
461
  except ImportError as ie:
462
  has_tensorboard = False
wandb/debug-internal.log ADDED
@@ -0,0 +1 @@
 
 
1
+ run-20210709_103433-d7n9baaw/logs/debug-internal.log
wandb/debug.log ADDED
@@ -0,0 +1 @@
 
 
1
+ run-20210709_103433-d7n9baaw/logs/debug.log
wandb/latest-run ADDED
@@ -0,0 +1 @@
 
 
1
+ run-20210709_103433-d7n9baaw
wandb/run-20210709_103433-d7n9baaw/files/config.yaml ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ _wandb:
4
+ desc: null
5
+ value:
6
+ cli_version: 0.10.33
7
+ framework: huggingface
8
+ huggingface_version: 4.9.0.dev0
9
+ is_jupyter_run: false
10
+ is_kaggle_kernel: false
11
+ python_version: 3.8.10
12
+ t:
13
+ 1:
14
+ - 11
15
+ 4: 3.8.10
16
+ 5: 0.10.33
17
+ 6: 4.9.0.dev0
18
+ 8:
19
+ - 5
wandb/run-20210709_103433-d7n9baaw/logs/debug-internal.log ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2021-07-09 10:34:34,450 INFO MainThread:25100 [internal.py:wandb_internal():88] W&B internal server running at pid: 25100, started at: 2021-07-09 10:34:34.449847
2
+ 2021-07-09 10:34:34,452 DEBUG HandlerThread:25100 [handler.py:handle_request():124] handle_request: check_version
3
+ 2021-07-09 10:34:34,452 INFO WriterThread:25100 [datastore.py:open_for_write():80] open: /home/nipunsadvilkar/sample/roberta-base-mr/wandb/run-20210709_103433-d7n9baaw/run-d7n9baaw.wandb
4
+ 2021-07-09 10:34:34,453 DEBUG SenderThread:25100 [sender.py:send():179] send: header
5
+ 2021-07-09 10:34:34,453 DEBUG SenderThread:25100 [sender.py:send_request():193] send_request: check_version
6
+ 2021-07-09 10:34:34,515 DEBUG SenderThread:25100 [sender.py:send():179] send: run
7
+ 2021-07-09 10:34:34,556 ERROR SenderThread:25100 [internal_api.py:execute():130] 403 response executing GraphQL.
8
+ 2021-07-09 10:34:34,556 ERROR SenderThread:25100 [internal_api.py:execute():131] {"errors":[{"message":"permission denied","path":["upsertBucket"],"extensions":{"code":"PERMISSION_ERROR"}}],"data":{"upsertBucket":null}}
9
+ 2021-07-09 10:34:35,516 INFO HandlerThread:25100 [handler.py:finish():638] shutting down handler
10
+ 2021-07-09 10:34:35,517 INFO WriterThread:25100 [datastore.py:close():288] close: /home/nipunsadvilkar/sample/roberta-base-mr/wandb/run-20210709_103433-d7n9baaw/run-d7n9baaw.wandb
11
+ 2021-07-09 10:34:35,517 ERROR MainThread:25100 [internal.py:wandb_internal():159] Thread SenderThread:
12
+ Traceback (most recent call last):
13
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/lib/retry.py", line 102, in __call__
14
+ result = self._call_fn(*args, **kwargs)
15
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/internal/internal_api.py", line 133, in execute
16
+ six.reraise(*sys.exc_info())
17
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/six.py", line 719, in reraise
18
+ raise value
19
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/internal/internal_api.py", line 127, in execute
20
+ return self.client.execute(*args, **kwargs)
21
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/vendor/gql-0.2.0/gql/client.py", line 52, in execute
22
+ result = self._get_result(document, *args, **kwargs)
23
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/vendor/gql-0.2.0/gql/client.py", line 60, in _get_result
24
+ return self.transport.execute(document, *args, **kwargs)
25
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/vendor/gql-0.2.0/gql/transport/requests.py", line 39, in execute
26
+ request.raise_for_status()
27
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/requests/models.py", line 943, in raise_for_status
28
+ raise HTTPError(http_error_msg, response=self)
29
+ requests.exceptions.HTTPError: 403 Client Error: Forbidden for url: https://api.wandb.ai/graphql
30
+
31
+ During handling of the above exception, another exception occurred:
32
+
33
+ Traceback (most recent call last):
34
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/apis/normalize.py", line 24, in wrapper
35
+ return func(*args, **kwargs)
36
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/internal/internal_api.py", line 922, in upsert_run
37
+ response = self.gql(mutation, variable_values=variable_values, **kwargs)
38
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/lib/retry.py", line 118, in __call__
39
+ if not check_retry_fn(e):
40
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/util.py", line 727, in no_retry_auth
41
+ raise CommError("Permission denied, ask the project owner to grant you access")
42
+ wandb.errors.CommError: Permission denied, ask the project owner to grant you access
43
+
44
+ During handling of the above exception, another exception occurred:
45
+
46
+ Traceback (most recent call last):
47
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/internal/internal_util.py", line 55, in run
48
+ self._run()
49
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/internal/internal_util.py", line 105, in _run
50
+ self._process(record)
51
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/internal/internal.py", line 292, in _process
52
+ self._sm.send(record)
53
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/internal/sender.py", line 181, in send
54
+ send_handler(record)
55
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/internal/sender.py", line 604, in send_run
56
+ self._init_run(run, config_value_dict)
57
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/internal/sender.py", line 626, in _init_run
58
+ server_run, inserted = self._api.upsert_run(
59
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/apis/normalize.py", line 62, in wrapper
60
+ six.reraise(CommError, CommError(message, err), sys.exc_info()[2])
61
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/six.py", line 718, in reraise
62
+ raise value.with_traceback(tb)
63
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/apis/normalize.py", line 24, in wrapper
64
+ return func(*args, **kwargs)
65
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/internal/internal_api.py", line 922, in upsert_run
66
+ response = self.gql(mutation, variable_values=variable_values, **kwargs)
67
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/lib/retry.py", line 118, in __call__
68
+ if not check_retry_fn(e):
69
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/util.py", line 727, in no_retry_auth
70
+ raise CommError("Permission denied, ask the project owner to grant you access")
71
+ wandb.errors.CommError: Permission denied, ask the project owner to grant you access
72
+ 2021-07-09 10:34:37,565 INFO MainThread:25100 [internal.py:handle_exit():78] Internal process exited
wandb/run-20210709_103433-d7n9baaw/logs/debug.log ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2021-07-09 10:34:33,839 INFO MainThread:24042 [wandb_setup.py:_flush():69] setting env: {}
2
+ 2021-07-09 10:34:33,839 INFO MainThread:24042 [wandb_setup.py:_flush():69] setting login settings: {}
3
+ 2021-07-09 10:34:33,839 INFO MainThread:24042 [wandb_init.py:_log_setup():337] Logging user logs to /home/nipunsadvilkar/sample/roberta-base-mr/wandb/run-20210709_103433-d7n9baaw/logs/debug.log
4
+ 2021-07-09 10:34:33,839 INFO MainThread:24042 [wandb_init.py:_log_setup():338] Logging internal logs to /home/nipunsadvilkar/sample/roberta-base-mr/wandb/run-20210709_103433-d7n9baaw/logs/debug-internal.log
5
+ 2021-07-09 10:34:33,839 INFO MainThread:24042 [wandb_init.py:init():370] calling init triggers
6
+ 2021-07-09 10:34:33,839 INFO MainThread:24042 [wandb_init.py:init():375] wandb.init called with sweep_config: {}
7
+ config: {}
8
+ 2021-07-09 10:34:33,839 INFO MainThread:24042 [wandb_init.py:init():419] starting backend
9
+ 2021-07-09 10:34:33,839 INFO MainThread:24042 [backend.py:_multiprocessing_setup():70] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
10
+ 2021-07-09 10:34:33,940 INFO MainThread:24042 [backend.py:ensure_launched():135] starting backend process...
11
+ 2021-07-09 10:34:33,967 INFO MainThread:24042 [backend.py:ensure_launched():139] started backend process with pid: 25100
12
+ 2021-07-09 10:34:33,969 INFO MainThread:24042 [wandb_init.py:init():424] backend started and connected
13
+ 2021-07-09 10:34:33,971 INFO MainThread:24042 [wandb_init.py:init():472] updated telemetry
14
+ 2021-07-09 10:34:33,972 INFO MainThread:24042 [wandb_init.py:init():491] communicating current version
15
+ 2021-07-09 10:34:34,514 INFO MainThread:24042 [wandb_init.py:init():496] got version response
16
+ 2021-07-09 10:34:34,514 INFO MainThread:24042 [wandb_init.py:init():504] communicating run to backend with 30 second timeout
17
+ 2021-07-09 10:34:46,387 WARNING MainThread:24042 [wandb_init.py:init():781] interrupted
18
+ Traceback (most recent call last):
19
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/wandb_init.py", line 761, in init
20
+ run = wi.init()
21
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/wandb_init.py", line 505, in init
22
+ ret = backend.interface.communicate_run(run, timeout=30)
23
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/interface/interface.py", line 667, in communicate_run
24
+ return self._communicate_run(run, timeout=timeout)
25
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/interface/interface.py", line 655, in _communicate_run
26
+ resp = self._communicate(req, timeout=timeout)
27
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/interface/interface.py", line 545, in _communicate
28
+ return self._communicate_async(rec, local=local).get(timeout=timeout)
29
+ File "/home/nipunsadvilkar/roberta_mr_env/lib/python3.8/site-packages/wandb/sdk/interface/interface.py", line 82, in get
30
+ is_set = self._object_ready.wait(timeout)
31
+ File "/usr/lib/python3.8/threading.py", line 558, in wait
32
+ signaled = self._cond.wait(timeout)
33
+ File "/usr/lib/python3.8/threading.py", line 306, in wait
34
+ gotit = waiter.acquire(True, timeout)
35
+ KeyboardInterrupt
wandb/run-20210709_103433-d7n9baaw/run-d7n9baaw.wandb ADDED
Binary file (196 Bytes). View file