dat
committed on
Commit
•
3bb7acf
1
Parent(s):
4ac841b
Saving weights and logs of step 300000
Browse files
- checkpoint_300000 +3 -0
- events.out.tfevents.1626429561.t1v-n-f5c06ea1-w-0.782479.3.v2 +2 -2
- flax_model.msgpack +1 -1
- wandb/run-20210716_095921-13hxxunp/files/output.log +544 -0
- wandb/run-20210716_095921-13hxxunp/files/wandb-summary.json +1 -1
- wandb/run-20210716_095921-13hxxunp/logs/debug-internal.log +0 -0
- wandb/run-20210716_095921-13hxxunp/run-13hxxunp.wandb +0 -0
checkpoint_300000
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6871ad76b64c25dba81499753fe5d81cb29ae47e0273e2c1d5076aebf9939680
|
3 |
+
size 1530270447
|
events.out.tfevents.1626429561.t1v-n-f5c06ea1-w-0.782479.3.v2
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:284e0d9a865e4999c9430beb1ddc24ba9439a4a04b77594e8edd154a89055472
|
3 |
+
size 11281886
|
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 510090043
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a08bc06de8e2261ead63b6966f3532eeab82b895ad375a7789666478594b6200
|
3 |
size 510090043
|
wandb/run-20210716_095921-13hxxunp/files/output.log
CHANGED
@@ -8236,3 +8236,547 @@ Training...: 70649it [8:14:57, 2.68it/s]βββββββββββββ
|
|
8236 |
|
8237 |
|
8238 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8236 |
|
8237 |
|
8238 |
|
8239 |
+
Training...: 70699it [8:15:17, 2.69it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8240 |
+
|
8241 |
+
|
8242 |
+
|
8243 |
+
|
8244 |
+
|
8245 |
+
Training...: 70749it [8:15:37, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8246 |
+
|
8247 |
+
|
8248 |
+
|
8249 |
+
|
8250 |
+
|
8251 |
+
Training...: 70799it [8:15:57, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8252 |
+
|
8253 |
+
|
8254 |
+
|
8255 |
+
|
8256 |
+
|
8257 |
+
Training...: 70849it [8:16:17, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8258 |
+
|
8259 |
+
|
8260 |
+
|
8261 |
+
|
8262 |
+
|
8263 |
+
Training...: 70899it [8:16:37, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8264 |
+
|
8265 |
+
|
8266 |
+
|
8267 |
+
|
8268 |
+
|
8269 |
+
Training...: 70949it [8:16:57, 2.70it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8270 |
+
|
8271 |
+
|
8272 |
+
|
8273 |
+
|
8274 |
+
|
8275 |
+
Training...: 70999it [8:17:17, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8276 |
+
|
8277 |
+
|
8278 |
+
|
8279 |
+
|
8280 |
+
|
8281 |
+
Training...: 71049it [8:17:37, 2.68it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8282 |
+
|
8283 |
+
|
8284 |
+
|
8285 |
+
|
8286 |
+
|
8287 |
+
Training...: 71099it [8:17:57, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8288 |
+
|
8289 |
+
|
8290 |
+
|
8291 |
+
|
8292 |
+
|
8293 |
+
Training...: 71149it [8:18:17, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8294 |
+
|
8295 |
+
|
8296 |
+
|
8297 |
+
|
8298 |
+
|
8299 |
+
Training...: 71199it [8:18:37, 2.69it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8300 |
+
|
8301 |
+
|
8302 |
+
|
8303 |
+
|
8304 |
+
|
8305 |
+
Training...: 71249it [8:18:57, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8306 |
+
|
8307 |
+
|
8308 |
+
|
8309 |
+
|
8310 |
+
|
8311 |
+
Training...: 71299it [8:19:18, 2.69it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8312 |
+
|
8313 |
+
|
8314 |
+
|
8315 |
+
|
8316 |
+
|
8317 |
+
Training...: 71349it [8:19:38, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8318 |
+
|
8319 |
+
|
8320 |
+
|
8321 |
+
|
8322 |
+
|
8323 |
+
Training...: 71399it [8:19:58, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8324 |
+
|
8325 |
+
|
8326 |
+
|
8327 |
+
|
8328 |
+
|
8329 |
+
Training...: 71449it [8:20:18, 2.70it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8330 |
+
|
8331 |
+
|
8332 |
+
|
8333 |
+
|
8334 |
+
|
8335 |
+
Training...: 71499it [8:20:38, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8336 |
+
|
8337 |
+
|
8338 |
+
|
8339 |
+
|
8340 |
+
|
8341 |
+
Training...: 71549it [8:20:58, 2.70it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8342 |
+
|
8343 |
+
|
8344 |
+
|
8345 |
+
|
8346 |
+
|
8347 |
+
Training...: 71599it [8:21:18, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8348 |
+
|
8349 |
+
|
8350 |
+
|
8351 |
+
|
8352 |
+
|
8353 |
+
Training...: 71649it [8:21:38, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8354 |
+
|
8355 |
+
|
8356 |
+
|
8357 |
+
|
8358 |
+
|
8359 |
+
Training...: 71699it [8:21:58, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8360 |
+
|
8361 |
+
|
8362 |
+
|
8363 |
+
|
8364 |
+
|
8365 |
+
Training...: 71749it [8:22:18, 2.67it/s]βββββββββββββββββοΏ½οΏ½βββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8366 |
+
|
8367 |
+
|
8368 |
+
|
8369 |
+
|
8370 |
+
|
8371 |
+
Training...: 71799it [8:22:38, 2.69it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8372 |
+
|
8373 |
+
|
8374 |
+
|
8375 |
+
|
8376 |
+
|
8377 |
+
Training...: 71849it [8:22:58, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8378 |
+
|
8379 |
+
|
8380 |
+
|
8381 |
+
|
8382 |
+
|
8383 |
+
Training...: 71899it [8:23:18, 2.69it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8384 |
+
|
8385 |
+
|
8386 |
+
|
8387 |
+
|
8388 |
+
|
8389 |
+
Training...: 71949it [8:23:38, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8390 |
+
|
8391 |
+
|
8392 |
+
|
8393 |
+
|
8394 |
+
|
8395 |
+
Training...: 71999it [8:23:58, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8396 |
+
|
8397 |
+
|
8398 |
+
|
8399 |
+
|
8400 |
+
|
8401 |
+
Training...: 72049it [8:24:18, 2.70it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8402 |
+
|
8403 |
+
|
8404 |
+
|
8405 |
+
|
8406 |
+
|
8407 |
+
Training...: 72099it [8:24:38, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8408 |
+
|
8409 |
+
|
8410 |
+
|
8411 |
+
|
8412 |
+
|
8413 |
+
Training...: 72149it [8:24:58, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8414 |
+
|
8415 |
+
|
8416 |
+
|
8417 |
+
|
8418 |
+
|
8419 |
+
Training...: 72199it [8:25:18, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8420 |
+
|
8421 |
+
|
8422 |
+
|
8423 |
+
|
8424 |
+
|
8425 |
+
|
8426 |
+
Training...: 72250it [8:25:51, 4.01s/it]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8427 |
+
|
8428 |
+
|
8429 |
+
|
8430 |
+
|
8431 |
+
|
8432 |
+
Training...: 72304it [8:26:12, 1.39s/it]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8433 |
+
|
8434 |
+
|
8435 |
+
|
8436 |
+
|
8437 |
+
|
8438 |
+
Training...: 72354it [8:26:32, 1.39s/it]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8439 |
+
|
8440 |
+
|
8441 |
+
|
8442 |
+
|
8443 |
+
|
8444 |
+
Training...: 72406it [8:26:52, 1.09it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8445 |
+
|
8446 |
+
|
8447 |
+
|
8448 |
+
|
8449 |
+
|
8450 |
+
Training...: 72456it [8:27:12, 1.09it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8451 |
+
|
8452 |
+
|
8453 |
+
|
8454 |
+
|
8455 |
+
|
8456 |
+
Training...: 72504it [8:27:32, 1.45s/it]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8457 |
+
|
8458 |
+
|
8459 |
+
|
8460 |
+
|
8461 |
+
|
8462 |
+
Training...: 72558it [8:27:52, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8463 |
+
|
8464 |
+
|
8465 |
+
|
8466 |
+
|
8467 |
+
|
8468 |
+
Training...: 72610it [8:28:12, 2.26it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8469 |
+
|
8470 |
+
|
8471 |
+
|
8472 |
+
|
8473 |
+
|
8474 |
+
Training...: 72656it [8:28:32, 1.09it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8475 |
+
|
8476 |
+
|
8477 |
+
|
8478 |
+
|
8479 |
+
|
8480 |
+
Training...: 72706it [8:28:52, 1.09it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8481 |
+
|
8482 |
+
|
8483 |
+
|
8484 |
+
|
8485 |
+
|
8486 |
+
Training...: 72758it [8:29:12, 1.60it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8487 |
+
|
8488 |
+
|
8489 |
+
|
8490 |
+
|
8491 |
+
|
8492 |
+
Training...: 72808it [8:29:32, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8493 |
+
|
8494 |
+
|
8495 |
+
|
8496 |
+
|
8497 |
+
|
8498 |
+
Training...: 72858it [8:29:52, 1.59it/s]βββββββοΏ½οΏ½βββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8499 |
+
|
8500 |
+
|
8501 |
+
|
8502 |
+
|
8503 |
+
|
8504 |
+
Training...: 72908it [8:30:12, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8505 |
+
|
8506 |
+
|
8507 |
+
|
8508 |
+
|
8509 |
+
|
8510 |
+
Training...: 72960it [8:30:33, 2.25it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8511 |
+
|
8512 |
+
|
8513 |
+
|
8514 |
+
|
8515 |
+
|
8516 |
+
Training...: 73010it [8:30:53, 2.25it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8517 |
+
|
8518 |
+
|
8519 |
+
|
8520 |
+
|
8521 |
+
|
8522 |
+
Training...: 73060it [8:31:13, 2.25it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8523 |
+
|
8524 |
+
|
8525 |
+
|
8526 |
+
|
8527 |
+
|
8528 |
+
Training...: 73110it [8:31:33, 2.26it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8529 |
+
|
8530 |
+
|
8531 |
+
|
8532 |
+
|
8533 |
+
|
8534 |
+
Training...: 73154it [8:31:52, 1.39s/it]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8535 |
+
|
8536 |
+
|
8537 |
+
|
8538 |
+
|
8539 |
+
|
8540 |
+
Training...: 73204it [8:32:13, 1.39s/it]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8541 |
+
|
8542 |
+
|
8543 |
+
|
8544 |
+
|
8545 |
+
|
8546 |
+
Training...: 73258it [8:32:33, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8547 |
+
|
8548 |
+
|
8549 |
+
|
8550 |
+
|
8551 |
+
|
8552 |
+
Training...: 73310it [8:32:53, 2.24it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8553 |
+
|
8554 |
+
|
8555 |
+
|
8556 |
+
|
8557 |
+
|
8558 |
+
Training...: 73360it [8:33:13, 2.25it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8559 |
+
|
8560 |
+
|
8561 |
+
|
8562 |
+
|
8563 |
+
|
8564 |
+
Training...: 73410it [8:33:33, 2.26it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8565 |
+
|
8566 |
+
|
8567 |
+
|
8568 |
+
|
8569 |
+
|
8570 |
+
Training...: 73460it [8:33:53, 2.26it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8571 |
+
|
8572 |
+
|
8573 |
+
|
8574 |
+
|
8575 |
+
|
8576 |
+
Training...: 73512it [8:34:13, 3.10it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8577 |
+
|
8578 |
+
|
8579 |
+
|
8580 |
+
|
8581 |
+
Training...: 73564it [8:34:33, 4.16it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8582 |
+
|
8583 |
+
|
8584 |
+
|
8585 |
+
|
8586 |
+
Training...: 73610it [8:34:53, 2.13it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8587 |
+
|
8588 |
+
|
8589 |
+
|
8590 |
+
|
8591 |
+
Training...: 73664it [8:35:13, 4.15it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8592 |
+
|
8593 |
+
|
8594 |
+
|
8595 |
+
|
8596 |
+
|
8597 |
+
Training...: 73706it [8:35:33, 1.09it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8598 |
+
|
8599 |
+
|
8600 |
+
|
8601 |
+
|
8602 |
+
|
8603 |
+
Training...: 73758it [8:35:53, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8604 |
+
|
8605 |
+
|
8606 |
+
|
8607 |
+
|
8608 |
+
|
8609 |
+
Training...: 73808it [8:36:13, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8610 |
+
|
8611 |
+
|
8612 |
+
|
8613 |
+
|
8614 |
+
|
8615 |
+
Training...: 73854it [8:36:33, 1.43s/it]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8616 |
+
|
8617 |
+
|
8618 |
+
|
8619 |
+
|
8620 |
+
|
8621 |
+
Training...: 73910it [8:36:53, 2.26it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8622 |
+
|
8623 |
+
|
8624 |
+
|
8625 |
+
|
8626 |
+
|
8627 |
+
Training...: 73960it [8:37:13, 2.25it/s]οΏ½οΏ½οΏ½ββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8628 |
+
|
8629 |
+
|
8630 |
+
|
8631 |
+
|
8632 |
+
|
8633 |
+
Training...: 74010it [8:37:33, 2.26it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8634 |
+
|
8635 |
+
|
8636 |
+
|
8637 |
+
|
8638 |
+
|
8639 |
+
Training...: 74062it [8:37:54, 3.11it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8640 |
+
|
8641 |
+
|
8642 |
+
|
8643 |
+
|
8644 |
+
|
8645 |
+
Training...: 74106it [8:38:13, 1.09it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8646 |
+
|
8647 |
+
|
8648 |
+
|
8649 |
+
|
8650 |
+
|
8651 |
+
Training...: 74156it [8:38:33, 1.09it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8652 |
+
|
8653 |
+
|
8654 |
+
|
8655 |
+
|
8656 |
+
|
8657 |
+
Training...: 74208it [8:38:54, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8658 |
+
|
8659 |
+
|
8660 |
+
|
8661 |
+
|
8662 |
+
|
8663 |
+
Training...: 74258it [8:39:14, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8664 |
+
|
8665 |
+
|
8666 |
+
|
8667 |
+
|
8668 |
+
|
8669 |
+
Training...: 74308it [8:39:34, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8670 |
+
|
8671 |
+
|
8672 |
+
|
8673 |
+
|
8674 |
+
|
8675 |
+
Training...: 74358it [8:39:54, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8676 |
+
|
8677 |
+
|
8678 |
+
|
8679 |
+
|
8680 |
+
|
8681 |
+
Training...: 74408it [8:40:14, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8682 |
+
|
8683 |
+
|
8684 |
+
|
8685 |
+
|
8686 |
+
|
8687 |
+
Training...: 74460it [8:40:34, 2.26it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8688 |
+
|
8689 |
+
|
8690 |
+
|
8691 |
+
|
8692 |
+
Training...: 74499it [8:40:40, 2.69it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8693 |
+
|
8694 |
+
|
8695 |
+
|
8696 |
+
|
8697 |
+
|
8698 |
+
Training...: 74549it [8:41:00, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8699 |
+
|
8700 |
+
|
8701 |
+
|
8702 |
+
|
8703 |
+
Training...: 74599it [8:41:20, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8704 |
+
|
8705 |
+
|
8706 |
+
|
8707 |
+
|
8708 |
+
|
8709 |
+
Training...: 74664it [8:41:54, 4.16it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8710 |
+
|
8711 |
+
|
8712 |
+
|
8713 |
+
|
8714 |
+
Training...: 74712it [8:42:14, 2.86it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8715 |
+
|
8716 |
+
|
8717 |
+
|
8718 |
+
Training...: 74749it [8:42:20, 2.70it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8719 |
+
|
8720 |
+
|
8721 |
+
|
8722 |
+
|
8723 |
+
|
8724 |
+
|
8725 |
+
Training...: 74808it [8:42:54, 1.59it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8726 |
+
|
8727 |
+
|
8728 |
+
|
8729 |
+
|
8730 |
+
|
8731 |
+
Training...: 74860it [8:43:14, 2.25it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8732 |
+
|
8733 |
+
|
8734 |
+
|
8735 |
+
|
8736 |
+
|
8737 |
+
Training...: 74910it [8:43:34, 2.25it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8738 |
+
|
8739 |
+
|
8740 |
+
|
8741 |
+
|
8742 |
+
Training...: 74949it [8:43:40, 2.67it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8743 |
+
|
8744 |
+
|
8745 |
+
|
8746 |
+
|
8747 |
+
Training...: 74999it [8:44:00, 2.70it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8748 |
+
Training...: 74999it [8:44:14, 2.70it/s]βββββββββββββββββββββββββββββββββββββββββββββββββ| 500/500 [00:59<00:00, 7.91it/s]
|
8749 |
+
|
8750 |
+
|
8751 |
+
|
8752 |
+
|
8753 |
+
|
8754 |
+
|
8755 |
+
|
8756 |
+
|
8757 |
+
|
8758 |
+
|
8759 |
+
|
8760 |
+
|
8761 |
+
|
8762 |
+
|
8763 |
+
|
8764 |
+
|
8765 |
+
|
8766 |
+
|
8767 |
+
|
8768 |
+
|
8769 |
+
|
8770 |
+
|
8771 |
+
|
8772 |
+
|
8773 |
+
|
8774 |
+
|
8775 |
+
|
8776 |
+
|
8777 |
+
|
8778 |
+
|
8779 |
+
tcmalloc: large alloc 2715181056 bytes == 0x41d306000 @ 0x7fe91a70f680 0x7fe91a72fbdd 0x7fe900cc920d 0x7fe900cd7340 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd6e87 0x7fe900cd2bd3 0x7fe900cd31fe 0x504d56 0x56acb6 0x568d9a 0x5f5b33 0x56bc9b 0x5f5956 0x56aadf 0x5f5956 0x56fb87 0x568d9a 0x5f5b33 0x56bc9b 0x568d9a
|
8780 |
+
[18:50:39] - INFO - absl - Saved checkpoint at checkpoint_300000
|
8781 |
+
[18:50:41] - INFO - huggingface_hub.repository - git version 2.25.1
|
8782 |
+
git-lfs/2.9.2 (GitHub; linux amd64; go 1.13.5)
|
wandb/run-20210716_095921-13hxxunp/files/wandb-summary.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"training_step":
|
|
|
1 |
+
{"training_step": 300000, "learning_rate": 2.503942778275814e-05, "train_loss": 1.888529658317566, "_runtime": 31870, "_timestamp": 1626461432, "_step": 1512, "eval_step": 300000, "eval_accuracy": 0.6334131956100464, "eval_loss": 1.8694549798965454}
|
wandb/run-20210716_095921-13hxxunp/logs/debug-internal.log
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
wandb/run-20210716_095921-13hxxunp/run-13hxxunp.wandb
CHANGED
Binary files a/wandb/run-20210716_095921-13hxxunp/run-13hxxunp.wandb and b/wandb/run-20210716_095921-13hxxunp/run-13hxxunp.wandb differ
|
|