Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
1d68492
1 Parent(s): 5602ad9

Training in progress, step 350000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f848b004ca69d971cd5024827329eb728808850f3ba285aae6ae2d66c5e9a1ea
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2412ccb8485cd06f014a9d3ba5fd1d0975b7e018d8cff9900e50d917bc1fdf5d
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5bfba4eea74dece360d73bbeb68171b0f24c78184fc1168b69bc18ed84fe5243
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce357ce3d6b529f718a69a4a019a30353262fc7b3a74b394a29c905d74c6bace
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20c5b304cccca8b5844ddfec128e44995bacab68346ff44d01e8476a83259d32
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cf77bfa9438d97e6b94c6d8adb49ea05fe2793189bc403350f9c99c3df0b70f
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a6026e8cbd4826fee12ad344c0bb2e47d863082fccddfed4801c66cbc3305df
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4364109b281ee76bcd1190601f937d3035fb627994056b37c2278ac5b210512f
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:276a39a4e5fc9bbf2fc7156d49a68ce7b2b8c02aa8d52e98747eb94a987f3191
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76fee5dcfb398dec8998f78597ffb2351be755c012a3c680797e842622a89e1a
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e64783857a8ded45f594a9d4d98ef3bd8c1d156f9923bb0bef61858daa470a8e
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fe21a6975cd1ab6dcf33bd2f5c91b79d5cc1adb46d481b8d3e4e4d4a9034b6a
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e61c24f771644e6cd7fccf329b7b1a8621bd89eecc91f4043864ce60f81c96b6
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef93f126c2f64dc8d66788d8ad781c47bda9696dee0f2e314ba09dc6f0be1c9e
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 5.19187014216562,
5
- "global_step": 340000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -2522,11 +2522,85 @@
2522
  "eval_samples_per_second": 796.26,
2523
  "eval_steps_per_second": 12.74,
2524
  "step": 340000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2525
  }
2526
  ],
2527
  "max_steps": 1000000,
2528
  "num_train_epochs": 16,
2529
- "total_flos": 2.383405589691059e+22,
2530
  "trial_name": null,
2531
  "trial_params": null
2532
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 5.344572205170492,
5
+ "global_step": 350000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
2522
  "eval_samples_per_second": 796.26,
2523
  "eval_steps_per_second": 12.74,
2524
  "step": 340000
2525
+ },
2526
+ {
2527
+ "epoch": 5.21,
2528
+ "learning_rate": 0.00012001328690714582,
2529
+ "loss": 0.284,
2530
+ "step": 341000
2531
+ },
2532
+ {
2533
+ "epoch": 5.22,
2534
+ "learning_rate": 0.00011982312984759068,
2535
+ "loss": 0.2845,
2536
+ "step": 342000
2537
+ },
2538
+ {
2539
+ "epoch": 5.24,
2540
+ "learning_rate": 0.00011963253728866778,
2541
+ "loss": 0.2841,
2542
+ "step": 343000
2543
+ },
2544
+ {
2545
+ "epoch": 5.25,
2546
+ "learning_rate": 0.00011944151131466675,
2547
+ "loss": 0.284,
2548
+ "step": 344000
2549
+ },
2550
+ {
2551
+ "epoch": 5.27,
2552
+ "learning_rate": 0.00011925005401461709,
2553
+ "loss": 0.2836,
2554
+ "step": 345000
2555
+ },
2556
+ {
2557
+ "epoch": 5.27,
2558
+ "eval_runtime": 1.1037,
2559
+ "eval_samples_per_second": 906.031,
2560
+ "eval_steps_per_second": 14.496,
2561
+ "step": 345000
2562
+ },
2563
+ {
2564
+ "epoch": 5.28,
2565
+ "learning_rate": 0.00011905816748226513,
2566
+ "loss": 0.2834,
2567
+ "step": 346000
2568
+ },
2569
+ {
2570
+ "epoch": 5.3,
2571
+ "learning_rate": 0.00011886585381605125,
2572
+ "loss": 0.2835,
2573
+ "step": 347000
2574
+ },
2575
+ {
2576
+ "epoch": 5.31,
2577
+ "learning_rate": 0.00011867311511908693,
2578
+ "loss": 0.2832,
2579
+ "step": 348000
2580
+ },
2581
+ {
2582
+ "epoch": 5.33,
2583
+ "learning_rate": 0.00011847995349913162,
2584
+ "loss": 0.2828,
2585
+ "step": 349000
2586
+ },
2587
+ {
2588
+ "epoch": 5.34,
2589
+ "learning_rate": 0.00011828637106856989,
2590
+ "loss": 0.2828,
2591
+ "step": 350000
2592
+ },
2593
+ {
2594
+ "epoch": 5.34,
2595
+ "eval_runtime": 1.0295,
2596
+ "eval_samples_per_second": 971.32,
2597
+ "eval_steps_per_second": 15.541,
2598
+ "step": 350000
2599
  }
2600
  ],
2601
  "max_steps": 1000000,
2602
  "num_train_epochs": 16,
2603
+ "total_flos": 2.4535058507214063e+22,
2604
  "trial_name": null,
2605
  "trial_params": null
2606
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5bfba4eea74dece360d73bbeb68171b0f24c78184fc1168b69bc18ed84fe5243
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce357ce3d6b529f718a69a4a019a30353262fc7b3a74b394a29c905d74c6bace
3
  size 449471589